Commit b5870168 authored by Thomas Hellström's avatar Thomas Hellström
Browse files

drm/xe: Implement and use the drm_pagemap populate_mm op



Add runtime PM since we might call populate_mm on a foreign device.

v3:
- Fix a kerneldoc failure (Matt Brost)
- Revert the bo type change from device to kernel (Matt Brost)
v4:
- Add an assert in xe_svm_alloc_vram (Matt Brost)

Signed-off-by: default avatarThomas Hellström <thomas.hellstrom@linux.intel.com>
Reviewed-by: default avatarMatthew Brost <matthew.brost@intel.com>
Link: https://lore.kernel.org/r/20250619134035.170086-4-thomas.hellstrom@linux.intel.com
parent 2ef19be2
Loading
Loading
Loading
Loading
+1 −0
Original line number Diff line number Diff line
@@ -835,3 +835,4 @@ int drm_pagemap_populate_mm(struct drm_pagemap *dpagemap,

	return err;
}
EXPORT_SYMBOL(drm_pagemap_populate_mm);
+60 −42
Original line number Diff line number Diff line
@@ -3,13 +3,17 @@
 * Copyright © 2024 Intel Corporation
 */

#include <drm/drm_drv.h>

#include "xe_bo.h"
#include "xe_gt_stats.h"
#include "xe_gt_tlb_invalidation.h"
#include "xe_migrate.h"
#include "xe_module.h"
#include "xe_pm.h"
#include "xe_pt.h"
#include "xe_svm.h"
#include "xe_tile.h"
#include "xe_ttm_vram_mgr.h"
#include "xe_vm.h"
#include "xe_vm_types.h"
@@ -491,8 +495,10 @@ static struct xe_bo *to_xe_bo(struct drm_pagemap_devmem *devmem_allocation)
static void xe_svm_devmem_release(struct drm_pagemap_devmem *devmem_allocation)
{
	struct xe_bo *bo = to_xe_bo(devmem_allocation);
	struct xe_device *xe = xe_bo_device(bo);

	xe_bo_put_async(bo);
	xe_pm_runtime_put(xe);
}

static u64 block_offset_to_pfn(struct xe_vram_region *vr, u64 offset)
@@ -682,76 +688,63 @@ static struct xe_vram_region *tile_to_vr(struct xe_tile *tile)
	return &tile->mem.vram;
}

/**
 * xe_svm_alloc_vram()- Allocate device memory pages for range,
 * migrating existing data.
 * @vm: The VM.
 * @tile: tile to allocate vram from
 * @range: SVM range
 * @ctx: DRM GPU SVM context
 *
 * Return: 0 on success, error code on failure.
 */
int xe_svm_alloc_vram(struct xe_vm *vm, struct xe_tile *tile,
		      struct xe_svm_range *range,
		      const struct drm_gpusvm_ctx *ctx)
static int xe_drm_pagemap_populate_mm(struct drm_pagemap *dpagemap,
				      unsigned long start, unsigned long end,
				      struct mm_struct *mm,
				      unsigned long timeslice_ms)
{
	struct mm_struct *mm = vm->svm.gpusvm.mm;
	struct xe_tile *tile = container_of(dpagemap, typeof(*tile), mem.vram.dpagemap);
	struct xe_device *xe = tile_to_xe(tile);
	struct device *dev = xe->drm.dev;
	struct xe_vram_region *vr = tile_to_vr(tile);
	struct drm_buddy_block *block;
	struct list_head *blocks;
	struct xe_bo *bo;
	ktime_t end = 0;
	int err;

	if (!range->base.flags.migrate_devmem)
		return -EINVAL;
	ktime_t time_end = 0;
	int err, idx;

	range_debug(range, "ALLOCATE VRAM");
	if (!drm_dev_enter(&xe->drm, &idx))
		return -ENODEV;

	if (!mmget_not_zero(mm))
		return -EFAULT;
	mmap_read_lock(mm);
	xe_pm_runtime_get(xe);

 retry:
	bo = xe_bo_create_locked(tile_to_xe(tile), NULL, NULL,
				 xe_svm_range_size(range),
	bo = xe_bo_create_locked(tile_to_xe(tile), NULL, NULL, end - start,
				 ttm_bo_type_device,
				 XE_BO_FLAG_VRAM_IF_DGFX(tile) |
				 XE_BO_FLAG_CPU_ADDR_MIRROR);
	if (IS_ERR(bo)) {
		err = PTR_ERR(bo);
		if (xe_vm_validate_should_retry(NULL, err, &end))
		if (xe_vm_validate_should_retry(NULL, err, &time_end))
			goto retry;
		goto unlock;
		goto out_pm_put;
	}

	drm_pagemap_devmem_init(&bo->devmem_allocation,
				vm->xe->drm.dev, mm,
	drm_pagemap_devmem_init(&bo->devmem_allocation, dev, mm,
				&dpagemap_devmem_ops,
				&tile->mem.vram.dpagemap,
				xe_svm_range_size(range));
				end - start);

	blocks = &to_xe_ttm_vram_mgr_resource(bo->ttm.resource)->blocks;
	list_for_each_entry(block, blocks, link)
		block->private = vr;

	xe_bo_get(bo);
	err = drm_pagemap_migrate_to_devmem(&bo->devmem_allocation,
					    mm,
					    xe_svm_range_start(range),
					    xe_svm_range_end(range),
					    ctx->timeslice_ms,
					    xe_svm_devm_owner(vm->xe));

	/* Ensure the device has a pm ref while there are device pages active. */
	xe_pm_runtime_get_noresume(xe);
	err = drm_pagemap_migrate_to_devmem(&bo->devmem_allocation, mm,
					    start, end, timeslice_ms,
					    xe_svm_devm_owner(xe));
	if (err)
		xe_svm_devmem_release(&bo->devmem_allocation);

	xe_bo_unlock(bo);
	xe_bo_put(bo);

unlock:
	mmap_read_unlock(mm);
	mmput(mm);
out_pm_put:
	xe_pm_runtime_put(xe);
	drm_dev_exit(idx);

	return err;
}
@@ -859,7 +852,7 @@ int xe_svm_handle_pagefault(struct xe_vm *vm, struct xe_vma *vma,

	if (--migrate_try_count >= 0 &&
	    xe_svm_range_needs_migrate_to_vram(range, vma, IS_DGFX(vm->xe))) {
		err = xe_svm_alloc_vram(vm, tile, range, &ctx);
		err = xe_svm_alloc_vram(tile, range, &ctx);
		ctx.timeslice_ms <<= 1;	/* Double timeslice if we have to retry */
		if (err) {
			if (migrate_try_count || !ctx.devmem_only) {
@@ -1006,6 +999,30 @@ int xe_svm_range_get_pages(struct xe_vm *vm, struct xe_svm_range *range,

#if IS_ENABLED(CONFIG_DRM_XE_PAGEMAP)

/**
 * xe_svm_alloc_vram()- Allocate device memory pages for range,
 * migrating existing data.
 * @tile: tile to allocate vram from
 * @range: SVM range
 * @ctx: DRM GPU SVM context
 *
 * Return: 0 on success, error code on failure.
 */
int xe_svm_alloc_vram(struct xe_tile *tile, struct xe_svm_range *range,
		      const struct drm_gpusvm_ctx *ctx)
{
	struct drm_pagemap *dpagemap;

	xe_assert(tile_to_xe(tile), range->base.flags.migrate_devmem);
	range_debug(range, "ALLOCATE VRAM");

	dpagemap = xe_tile_local_pagemap(tile);
	return drm_pagemap_populate_mm(dpagemap, xe_svm_range_start(range),
				       xe_svm_range_end(range),
				       range->base.gpusvm->mm,
				       ctx->timeslice_ms);
}

static struct drm_pagemap_device_addr
xe_drm_pagemap_device_map(struct drm_pagemap *dpagemap,
			  struct device *dev,
@@ -1030,6 +1047,7 @@ xe_drm_pagemap_device_map(struct drm_pagemap *dpagemap,

static const struct drm_pagemap_ops xe_drm_pagemap_ops = {
	.device_map = xe_drm_pagemap_device_map,
	.populate_mm = xe_drm_pagemap_populate_mm,
};

/**
@@ -1082,7 +1100,7 @@ int xe_devm_add(struct xe_tile *tile, struct xe_vram_region *vr)
	return 0;
}
#else
int xe_svm_alloc_vram(struct xe_vm *vm, struct xe_tile *tile,
int xe_svm_alloc_vram(struct xe_tile *tile,
		      struct xe_svm_range *range,
		      const struct drm_gpusvm_ctx *ctx)
{
+4 −6
Original line number Diff line number Diff line
@@ -70,8 +70,7 @@ int xe_svm_bo_evict(struct xe_bo *bo);

void xe_svm_range_debug(struct xe_svm_range *range, const char *operation);

int xe_svm_alloc_vram(struct xe_vm *vm, struct xe_tile *tile,
		      struct xe_svm_range *range,
int xe_svm_alloc_vram(struct xe_tile *tile, struct xe_svm_range *range,
		      const struct drm_gpusvm_ctx *ctx);

struct xe_svm_range *xe_svm_range_find_or_insert(struct xe_vm *vm, u64 addr,
@@ -237,9 +236,8 @@ void xe_svm_range_debug(struct xe_svm_range *range, const char *operation)
{
}

static inline
int xe_svm_alloc_vram(struct xe_vm *vm, struct xe_tile *tile,
		      struct xe_svm_range *range,
static inline int
xe_svm_alloc_vram(struct xe_tile *tile, struct xe_svm_range *range,
		  const struct drm_gpusvm_ctx *ctx)
{
	return -EOPNOTSUPP;
+11 −0
Original line number Diff line number Diff line
@@ -16,4 +16,15 @@ int xe_tile_init(struct xe_tile *tile);

void xe_tile_migrate_wait(struct xe_tile *tile);

#if IS_ENABLED(CONFIG_DRM_XE_PAGEMAP)
static inline struct drm_pagemap *xe_tile_local_pagemap(struct xe_tile *tile)
{
	return &tile->mem.vram.dpagemap;
}
#else
static inline struct drm_pagemap *xe_tile_local_pagemap(struct xe_tile *tile)
{
	return NULL;
}
#endif
#endif
+1 −1
Original line number Diff line number Diff line
@@ -2913,7 +2913,7 @@ static int prefetch_ranges(struct xe_vm *vm, struct xe_vma_op *op)

		if (xe_svm_range_needs_migrate_to_vram(svm_range, vma, region)) {
			tile = &vm->xe->tiles[region_to_mem_type[region] - XE_PL_VRAM0];
			err = xe_svm_alloc_vram(vm, tile, svm_range, &ctx);
			err = xe_svm_alloc_vram(tile, svm_range, &ctx);
			if (err) {
				drm_dbg(&vm->xe->drm, "VRAM allocation failed, retry from userspace, asid=%u, gpusvm=%p, errno=%pe\n",
					vm->usm.asid, &vm->svm.gpusvm, ERR_PTR(err));