drm/xe: Use the vma attribute drm_pagemap to select where to migrate
Honor the drm_pagemap vma attribute when migrating SVM pages. Ensure
that when the desired placement is validated as device memory, we also
check that the requested drm_pagemap is consistent with the current
one.

v2:
- Initialize a struct drm_pagemap pointer to NULL that could otherwise
  be dereferenced uninitialized. (CI)
- Remove a redundant assignment. (Matt Brost)
- Slightly improved commit message. (Matt Brost)
- Extended drm_pagemap validation.

v3:
- Fix a compilation error if CONFIG_DRM_GPUSVM is not enabled.
  (kernel test robot <lkp@intel.com>)

Signed-off-by: Thomas Hellström <thomas.hellstrom@linux.intel.com>
Reviewed-by: Himal Prasad Ghimiray <himal.prasad.ghimiray@intel.com>
Link: https://patch.msgid.link/20251219113320.183860-14-thomas.hellstrom@linux.intel.com
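In short, migration placement is now driven by a struct drm_pagemap resolved
from the vma attributes, and validation compares that requested pagemap
against the one currently backing the range. The following is a minimal,
self-contained sketch of that flow; it uses made-up stand-in types and
placeholder constants (struct pagemap, struct preferred_loc, LOC_DEFAULT_*),
not the real xe/drm_pagemap definitions used in the diff below.

/*
 * Illustrative sketch only: simplified stand-in types, and placeholder
 * constants rather than the real DRM_XE_PREFERRED_LOC_* values.
 */
#include <stddef.h>

struct pagemap;				/* stands in for struct drm_pagemap */

enum preferred_loc_fd {
	LOC_DEFAULT_SYSTEM = -2,	/* placeholder value */
	LOC_DEFAULT_DEVICE = -1,	/* placeholder value */
};

struct preferred_loc {
	struct pagemap *dpagemap;	/* explicit placement attribute, may be NULL */
	int devmem_fd;			/* or a default-selection token */
};

/*
 * Roughly what xe_vma_resolve_pagemap() does after this patch: an explicit
 * drm_pagemap attribute wins, otherwise fall back to the device-default
 * pagemap, otherwise system memory (NULL).
 */
static struct pagemap *resolve_pagemap(const struct preferred_loc *loc,
				       struct pagemap *tile_local_pagemap)
{
	if (loc->dpagemap)
		return loc->dpagemap;
	if (loc->devmem_fd == LOC_DEFAULT_DEVICE)
		return tile_local_pagemap;
	return NULL;
}

/*
 * Roughly what xe_svm_range_has_pagemap_locked() checks: a range only counts
 * as correctly placed when it is backed by the requested pagemap, not merely
 * by some device memory.
 */
static int range_matches_pagemap(const struct pagemap *range_dpagemap,
				 const struct pagemap *requested)
{
	return range_dpagemap == requested;
}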
@@ -887,13 +887,34 @@ void xe_svm_fini(struct xe_vm *vm)
 	drm_gpusvm_fini(&vm->svm.gpusvm);
 }
 
+static bool xe_svm_range_has_pagemap_locked(const struct xe_svm_range *range,
+					    const struct drm_pagemap *dpagemap)
+{
+	return range->base.pages.dpagemap == dpagemap;
+}
+
+static bool xe_svm_range_has_pagemap(struct xe_svm_range *range,
+				     const struct drm_pagemap *dpagemap)
+{
+	struct xe_vm *vm = range_to_vm(&range->base);
+	bool ret;
+
+	xe_svm_notifier_lock(vm);
+	ret = xe_svm_range_has_pagemap_locked(range, dpagemap);
+	xe_svm_notifier_unlock(vm);
+
+	return ret;
+}
+
 static bool xe_svm_range_is_valid(struct xe_svm_range *range,
 				  struct xe_tile *tile,
-				  bool devmem_only)
+				  bool devmem_only,
+				  const struct drm_pagemap *dpagemap)
+
 {
 	return (xe_vm_has_valid_gpu_mapping(tile, range->tile_present,
 					    range->tile_invalidated) &&
-		(!devmem_only || xe_svm_range_in_vram(range)));
+		(!devmem_only || xe_svm_range_has_pagemap(range, dpagemap)));
 }
 
 /** xe_svm_range_migrate_to_smem() - Move range pages from VRAM to SMEM
@@ -914,7 +935,8 @@ void xe_svm_range_migrate_to_smem(struct xe_vm *vm, struct xe_svm_range *range)
 * @vm: xe_vm pointer
 * @range: Pointer to the SVM range structure
 * @tile_mask: Mask representing the tiles to be checked
- * @devmem_preferred : if true range needs to be in devmem
+ * @dpagemap: if !%NULL, the range is expected to be present
+ * in device memory identified by this parameter.
 *
 * The xe_svm_range_validate() function checks if a range is
 * valid and located in the desired memory region.
@@ -923,14 +945,15 @@ void xe_svm_range_migrate_to_smem(struct xe_vm *vm, struct xe_svm_range *range)
 */
 bool xe_svm_range_validate(struct xe_vm *vm,
			   struct xe_svm_range *range,
-			   u8 tile_mask, bool devmem_preferred)
+			   u8 tile_mask, const struct drm_pagemap *dpagemap)
 {
 	bool ret;
 
 	xe_svm_notifier_lock(vm);
 
-	ret = (range->tile_present & ~range->tile_invalidated & tile_mask) == tile_mask &&
-	      (devmem_preferred == range->base.pages.flags.has_devmem_pages);
+	ret = (range->tile_present & ~range->tile_invalidated & tile_mask) == tile_mask;
+	if (dpagemap)
+		ret = ret && xe_svm_range_has_pagemap_locked(range, dpagemap);
 
 	xe_svm_notifier_unlock(vm);
 
@@ -1044,22 +1067,22 @@ static bool supports_4K_migration(struct xe_device *xe)
 * xe_svm_range_needs_migrate_to_vram() - SVM range needs migrate to VRAM or not
 * @range: SVM range for which migration needs to be decided
 * @vma: vma which has range
- * @preferred_region_is_vram: preferred region for range is vram
+ * @dpagemap: The preferred struct drm_pagemap to migrate to.
 *
 * Return: True for range needing migration and migration is supported else false
 */
 bool xe_svm_range_needs_migrate_to_vram(struct xe_svm_range *range, struct xe_vma *vma,
-					bool preferred_region_is_vram)
+					const struct drm_pagemap *dpagemap)
 {
 	struct xe_vm *vm = range_to_vm(&range->base);
 	u64 range_size = xe_svm_range_size(range);
 
-	if (!range->base.pages.flags.migrate_devmem || !preferred_region_is_vram)
+	if (!range->base.pages.flags.migrate_devmem || !dpagemap)
 		return false;
 
 	xe_assert(vm->xe, IS_DGFX(vm->xe));
 
-	if (xe_svm_range_in_vram(range)) {
+	if (xe_svm_range_has_pagemap(range, dpagemap)) {
 		drm_dbg(&vm->xe->drm, "Range is already in VRAM\n");
 		return false;
 	}
@@ -1156,9 +1179,9 @@ static int __xe_svm_handle_pagefault(struct xe_vm *vm, struct xe_vma *vma,
 	if (err)
 		return err;
 
-	dpagemap = xe_vma_resolve_pagemap(vma, tile);
-	ctx.device_private_page_owner =
-		xe_svm_private_page_owner(vm, !dpagemap && !ctx.devmem_only);
+	dpagemap = ctx.devmem_only ? xe_tile_local_pagemap(tile) :
+		xe_vma_resolve_pagemap(vma, tile);
+	ctx.device_private_page_owner = xe_svm_private_page_owner(vm, !dpagemap);
 	range = xe_svm_range_find_or_insert(vm, fault_addr, vma, &ctx);
 
 	if (IS_ERR(range))
@@ -1171,7 +1194,7 @@ static int __xe_svm_handle_pagefault(struct xe_vm *vm, struct xe_vma *vma,
 		goto out;
 	}
 
-	if (xe_svm_range_is_valid(range, tile, ctx.devmem_only)) {
+	if (xe_svm_range_is_valid(range, tile, ctx.devmem_only, dpagemap)) {
 		xe_svm_range_valid_fault_count_stats_incr(gt, range);
 		range_debug(range, "PAGE FAULT - VALID");
 		goto out;
@@ -1180,16 +1203,11 @@ static int __xe_svm_handle_pagefault(struct xe_vm *vm, struct xe_vma *vma,
 	range_debug(range, "PAGE FAULT");
 
 	if (--migrate_try_count >= 0 &&
-	    xe_svm_range_needs_migrate_to_vram(range, vma, !!dpagemap || ctx.devmem_only)) {
+	    xe_svm_range_needs_migrate_to_vram(range, vma, dpagemap)) {
 		ktime_t migrate_start = xe_gt_stats_ktime_get();
 
-		/* TODO : For multi-device dpagemap will be used to find the
-		 * remote tile and remote device. Will need to modify
-		 * xe_svm_alloc_vram to use dpagemap for future multi-device
-		 * support.
-		 */
 		xe_svm_range_migrate_count_stats_incr(gt, range);
-		err = xe_svm_alloc_vram(tile, range, &ctx);
+		err = xe_svm_alloc_vram(range, &ctx, dpagemap);
 		xe_svm_range_migrate_us_stats_incr(gt, range, migrate_start);
 		ctx.timeslice_ms <<= 1; /* Double timeslice if we have to retry */
 		if (err) {
@@ -1506,7 +1524,13 @@ u8 xe_svm_ranges_zap_ptes_in_range(struct xe_vm *vm, u64 start, u64 end)
 */
 struct drm_pagemap *xe_vma_resolve_pagemap(struct xe_vma *vma, struct xe_tile *tile)
 {
-	s32 fd = (s32)vma->attr.preferred_loc.devmem_fd;
+	struct drm_pagemap *dpagemap = vma->attr.preferred_loc.dpagemap;
+	s32 fd;
+
+	if (dpagemap)
+		return dpagemap;
+
+	fd = (s32)vma->attr.preferred_loc.devmem_fd;
 
 	if (fd == DRM_XE_PREFERRED_LOC_DEFAULT_SYSTEM)
 		return NULL;
@@ -1514,28 +1538,24 @@ struct drm_pagemap *xe_vma_resolve_pagemap(struct xe_vma *vma, struct xe_tile *t
 	if (fd == DRM_XE_PREFERRED_LOC_DEFAULT_DEVICE)
 		return IS_DGFX(tile_to_xe(tile)) ? xe_tile_local_pagemap(tile) : NULL;
 
 	/* TODO: Support multi-device with drm_pagemap_from_fd(fd) */
 	return NULL;
 }
 
 /**
 * xe_svm_alloc_vram()- Allocate device memory pages for range,
 * migrating existing data.
- * @tile: tile to allocate vram from
 * @range: SVM range
 * @ctx: DRM GPU SVM context
+ * @dpagemap: The struct drm_pagemap representing the memory to allocate.
 *
 * Return: 0 on success, error code on failure.
 */
-int xe_svm_alloc_vram(struct xe_tile *tile, struct xe_svm_range *range,
-		      const struct drm_gpusvm_ctx *ctx)
+int xe_svm_alloc_vram(struct xe_svm_range *range, const struct drm_gpusvm_ctx *ctx,
+		      struct drm_pagemap *dpagemap)
 {
-	struct drm_pagemap *dpagemap;
-
-	xe_assert(tile_to_xe(tile), range->base.pages.flags.migrate_devmem);
+	xe_assert(range_to_vm(&range->base)->xe, range->base.pages.flags.migrate_devmem);
 	range_debug(range, "ALLOCATE VRAM");
-
-	dpagemap = xe_tile_local_pagemap(tile);
 	return drm_pagemap_populate_mm(dpagemap, xe_svm_range_start(range),
				       xe_svm_range_end(range),
				       range->base.gpusvm->mm,
@@ -1805,9 +1825,9 @@ int xe_pagemap_cache_create(struct xe_tile *tile)
 	return 0;
 }
 
-int xe_svm_alloc_vram(struct xe_tile *tile,
-		      struct xe_svm_range *range,
-		      const struct drm_gpusvm_ctx *ctx)
+int xe_svm_alloc_vram(struct xe_svm_range *range,
+		      const struct drm_gpusvm_ctx *ctx,
+		      struct drm_pagemap *dpagemap)
 {
 	return -EOPNOTSUPP;
 }
@@ -94,8 +94,8 @@ int xe_svm_bo_evict(struct xe_bo *bo);
 
 void xe_svm_range_debug(struct xe_svm_range *range, const char *operation);
 
-int xe_svm_alloc_vram(struct xe_tile *tile, struct xe_svm_range *range,
-		      const struct drm_gpusvm_ctx *ctx);
+int xe_svm_alloc_vram(struct xe_svm_range *range, const struct drm_gpusvm_ctx *ctx,
+		      struct drm_pagemap *dpagemap);
 
 struct xe_svm_range *xe_svm_range_find_or_insert(struct xe_vm *vm, u64 addr,
						 struct xe_vma *vma, struct drm_gpusvm_ctx *ctx);
@@ -104,13 +104,13 @@ int xe_svm_range_get_pages(struct xe_vm *vm, struct xe_svm_range *range,
			   struct drm_gpusvm_ctx *ctx);
 
 bool xe_svm_range_needs_migrate_to_vram(struct xe_svm_range *range, struct xe_vma *vma,
-					bool preferred_region_is_vram);
+					const struct drm_pagemap *dpagemap);
 
 void xe_svm_range_migrate_to_smem(struct xe_vm *vm, struct xe_svm_range *range);
 
 bool xe_svm_range_validate(struct xe_vm *vm,
			   struct xe_svm_range *range,
-			   u8 tile_mask, bool devmem_preferred);
+			   u8 tile_mask, const struct drm_pagemap *dpagemap);
 
 u64 xe_svm_find_vma_start(struct xe_vm *vm, u64 addr, u64 end, struct xe_vma *vma);
 
@@ -276,8 +276,8 @@ void xe_svm_range_debug(struct xe_svm_range *range, const char *operation)
 }
 
 static inline int
-xe_svm_alloc_vram(struct xe_tile *tile, struct xe_svm_range *range,
-		  const struct drm_gpusvm_ctx *ctx)
+xe_svm_alloc_vram(struct xe_svm_range *range, const struct drm_gpusvm_ctx *ctx,
+		  struct drm_pagemap *dpagemap)
 {
 	return -EOPNOTSUPP;
 }
@@ -318,7 +318,7 @@ static inline unsigned long xe_svm_range_size(struct xe_svm_range *range)
 
 static inline
 bool xe_svm_range_needs_migrate_to_vram(struct xe_svm_range *range, struct xe_vma *vma,
-					u32 region)
+					const struct drm_pagemap *dpagemap)
 {
 	return false;
 }
@@ -2342,7 +2342,7 @@ vm_bind_ioctl_ops_create(struct xe_vm *vm, struct xe_vma_ops *vops,
			struct xe_tile *tile;
			struct xe_svm_range *svm_range;
			struct drm_gpusvm_ctx ctx = {};
-			struct drm_pagemap *dpagemap;
+			struct drm_pagemap *dpagemap = NULL;
			u8 id, tile_mask = 0;
			u32 i;
 
@@ -2360,23 +2360,17 @@ vm_bind_ioctl_ops_create(struct xe_vm *vm, struct xe_vma_ops *vops,
 
			xa_init_flags(&op->prefetch_range.range, XA_FLAGS_ALLOC);
			op->prefetch_range.ranges_count = 0;
-			tile = NULL;
 
			if (prefetch_region == DRM_XE_CONSULT_MEM_ADVISE_PREF_LOC) {
				dpagemap = xe_vma_resolve_pagemap(vma,
								  xe_device_get_root_tile(vm->xe));
-				/*
-				 * TODO: Once multigpu support is enabled will need
-				 * something to dereference tile from dpagemap.
-				 */
-				if (dpagemap)
-					tile = xe_device_get_root_tile(vm->xe);
			} else if (prefetch_region) {
				tile = &vm->xe->tiles[region_to_mem_type[prefetch_region] -
						      XE_PL_VRAM0];
+				dpagemap = xe_tile_local_pagemap(tile);
			}
 
-			op->prefetch_range.tile = tile;
+			op->prefetch_range.dpagemap = dpagemap;
 alloc_next_range:
			svm_range = xe_svm_range_find_or_insert(vm, addr, vma, &ctx);
 
@@ -2395,7 +2389,7 @@ vm_bind_ioctl_ops_create(struct xe_vm *vm, struct xe_vma_ops *vops,
				goto unwind_prefetch_ops;
			}
 
-			if (xe_svm_range_validate(vm, svm_range, tile_mask, !!tile)) {
+			if (xe_svm_range_validate(vm, svm_range, tile_mask, dpagemap)) {
				xe_svm_range_debug(svm_range, "PREFETCH - RANGE IS VALID");
				goto check_next_range;
			}
@@ -2917,7 +2911,7 @@ static int prefetch_ranges(struct xe_vm *vm, struct xe_vma_op *op)
 {
	bool devmem_possible = IS_DGFX(vm->xe) && IS_ENABLED(CONFIG_DRM_XE_PAGEMAP);
	struct xe_vma *vma = gpuva_to_vma(op->base.prefetch.va);
-	struct xe_tile *tile = op->prefetch_range.tile;
+	struct drm_pagemap *dpagemap = op->prefetch_range.dpagemap;
	int err = 0;
 
	struct xe_svm_range *svm_range;
@@ -2930,15 +2924,15 @@ static int prefetch_ranges(struct xe_vm *vm, struct xe_vma_op *op)
	ctx.read_only = xe_vma_read_only(vma);
	ctx.devmem_possible = devmem_possible;
	ctx.check_pages_threshold = devmem_possible ? SZ_64K : 0;
-	ctx.device_private_page_owner = xe_svm_private_page_owner(vm, !tile);
+	ctx.device_private_page_owner = xe_svm_private_page_owner(vm, !dpagemap);
 
	/* TODO: Threading the migration */
	xa_for_each(&op->prefetch_range.range, i, svm_range) {
-		if (!tile)
+		if (!dpagemap)
			xe_svm_range_migrate_to_smem(vm, svm_range);
 
-		if (xe_svm_range_needs_migrate_to_vram(svm_range, vma, !!tile)) {
-			err = xe_svm_alloc_vram(tile, svm_range, &ctx);
+		if (xe_svm_range_needs_migrate_to_vram(svm_range, vma, dpagemap)) {
+			err = xe_svm_alloc_vram(svm_range, &ctx, dpagemap);
			if (err) {
				drm_dbg(&vm->xe->drm, "VRAM allocation failed, retry from userspace, asid=%u, gpusvm=%p, errno=%pe\n",
					vm->usm.asid, &vm->svm.gpusvm, ERR_PTR(err));
@@ -408,10 +408,10 @@ struct xe_vma_op_prefetch_range {
	/** @ranges_count: number of svm ranges to map */
	u32 ranges_count;
	/**
-	 * @tile: Pointer to the tile structure containing memory to prefetch.
-	 * NULL if prefetch requested region is smem
+	 * @dpagemap: Pointer to the dpagemap structure containing memory to prefetch.
+	 * NULL if prefetch requested region is smem
	 */
-	struct xe_tile *tile;
+	struct drm_pagemap *dpagemap;
 };
 
 /** enum xe_vma_op_flags - flags for VMA operation */