Commit 6acf3d3e authored by Matt Roper's avatar Matt Roper
Browse files

drm/xe: Move number of XeCore fuse registers to graphics descriptor



The number of registers used to express the XeCore mask has some
"special cases" that don't always get inherited by later IP versions so
it's cleaner and simpler to record the numbers in the IP descriptor
rather than adding extra conditions to the standalone get_num_dss_regs()
function.

Note that a minor change here is that we now always treat the number of
registers as 0 for the media GT.  Technically a copy of these fuse
registers does exist in the media GT as well (at the usual
0x380000+$offset location), but the value of those is always supposed to
read back as 0 because media GTs never have any XeCores or EUs.

v2:
 - Add a kunit assertion to catch descriptors that forget to initialize
   either count.  (Gustavo)

Cc: Gustavo Sousa <gustavo.sousa@intel.com>
Reviewed-by: default avatarGustavo Sousa <gustavo.sousa@intel.com>
Link: https://patch.msgid.link/20260205214139.48515-3-matthew.d.roper@intel.com


Signed-off-by: default avatarMatt Roper <matthew.d.roper@intel.com>
parent 91be6115
Loading
Loading
Loading
Loading
+8 −0
Original line number Diff line number Diff line
@@ -19,6 +19,8 @@ static void check_graphics_ip(struct kunit *test)
	const struct xe_ip *param = test->param_value;
	const struct xe_graphics_desc *graphics = param->desc;
	u64 mask = graphics->hw_engine_mask;
	u8 fuse_regs = graphics->num_geometry_xecore_fuse_regs +
		graphics->num_compute_xecore_fuse_regs;

	/* RCS, CCS, and BCS engines are allowed on the graphics IP */
	mask &= ~(XE_HW_ENGINE_RCS_MASK |
@@ -27,6 +29,12 @@ static void check_graphics_ip(struct kunit *test)

	/* Any remaining engines are an error */
	KUNIT_ASSERT_EQ(test, mask, 0);

	/*
	 * All graphics IP should have at least one geometry and/or compute
	 * XeCore fuse register.
	 */
	KUNIT_ASSERT_GE(test, fuse_regs, 1);
}

static void check_media_ip(struct kunit *test)
+7 −30
Original line number Diff line number Diff line
@@ -205,24 +205,6 @@ load_l3_bank_mask(struct xe_gt *gt, xe_l3_bank_mask_t l3_bank_mask)
	}
}

static void
get_num_dss_regs(struct xe_device *xe, int *geometry_regs, int *compute_regs)
{
	if (GRAPHICS_VER(xe) > 20) {
		*geometry_regs = 3;
		*compute_regs = 3;
	} else if (GRAPHICS_VERx100(xe) == 1260) {
		*geometry_regs = 0;
		*compute_regs = 2;
	} else if (GRAPHICS_VERx100(xe) >= 1250) {
		*geometry_regs = 1;
		*compute_regs = 1;
	} else {
		*geometry_regs = 1;
		*compute_regs = 0;
	}
}

void
xe_gt_topology_init(struct xe_gt *gt)
{
@@ -236,23 +218,19 @@ xe_gt_topology_init(struct xe_gt *gt)
		XEHPC_GT_COMPUTE_DSS_ENABLE_EXT,
		XE2_GT_COMPUTE_DSS_2,
	};
	int num_geometry_regs, num_compute_regs;
	struct xe_device *xe = gt_to_xe(gt);
	struct drm_printer p;

	get_num_dss_regs(xe, &num_geometry_regs, &num_compute_regs);

	/*
	 * Register counts returned shouldn't exceed the number of registers
	 * passed as parameters below.
	 */
	xe_gt_assert(gt, num_geometry_regs <= ARRAY_SIZE(geometry_regs));
	xe_gt_assert(gt, num_compute_regs <= ARRAY_SIZE(compute_regs));
	xe_gt_assert(gt, gt->info.num_geometry_xecore_fuse_regs <= ARRAY_SIZE(geometry_regs));
	xe_gt_assert(gt, gt->info.num_compute_xecore_fuse_regs <= ARRAY_SIZE(compute_regs));

	load_dss_mask(gt, gt->fuse_topo.g_dss_mask,
		      num_geometry_regs, geometry_regs);
		      gt->info.num_geometry_xecore_fuse_regs, geometry_regs);
	load_dss_mask(gt, gt->fuse_topo.c_dss_mask,
		      num_compute_regs, compute_regs);
		      gt->info.num_compute_xecore_fuse_regs, compute_regs);

	load_eu_mask(gt, gt->fuse_topo.eu_mask_per_dss, &gt->fuse_topo.eu_type);
	load_l3_bank_mask(gt, gt->fuse_topo.l3_bank_mask);
@@ -330,15 +308,14 @@ xe_l3_bank_mask_ffs(const xe_l3_bank_mask_t mask)
 */
bool xe_gt_topology_has_dss_in_quadrant(struct xe_gt *gt, int quad)
{
	struct xe_device *xe = gt_to_xe(gt);
	xe_dss_mask_t all_dss;
	int g_dss_regs, c_dss_regs, dss_per_quad, quad_first;
	int dss_per_quad, quad_first;

	bitmap_or(all_dss, gt->fuse_topo.g_dss_mask, gt->fuse_topo.c_dss_mask,
		  XE_MAX_DSS_FUSE_BITS);

	get_num_dss_regs(xe, &g_dss_regs, &c_dss_regs);
	dss_per_quad = 32 * max(g_dss_regs, c_dss_regs) / 4;
	dss_per_quad = 32 * max(gt->info.num_geometry_xecore_fuse_regs,
				gt->info.num_compute_xecore_fuse_regs) / 4;

	quad_first = xe_dss_mask_group_ffs(all_dss, dss_per_quad, quad);

+10 −0
Original line number Diff line number Diff line
@@ -144,6 +144,16 @@ struct xe_gt {
		u8 id;
		/** @info.has_indirect_ring_state: GT has indirect ring state support */
		u8 has_indirect_ring_state:1;
		/**
		 * @info.num_geometry_xecore_fuse_regs: Number of 32b-bit fuse
		 * registers the geometry XeCore mask spans.
		 */
		u8 num_geometry_xecore_fuse_regs;
		/**
		 * @info.num_compute_xecore_fuse_regs: Number of 32b-bit fuse
		 * registers the compute XeCore mask spans.
		 */
		u8 num_compute_xecore_fuse_regs;
	} info;

#if IS_ENABLED(CONFIG_DEBUG_FS)
+12 −0
Original line number Diff line number Diff line
@@ -52,6 +52,7 @@ __diag_ignore_all("-Woverride-init", "Allow field overrides in table");

static const struct xe_graphics_desc graphics_xelp = {
	.hw_engine_mask = BIT(XE_HW_ENGINE_RCS0) | BIT(XE_HW_ENGINE_BCS0),
	.num_geometry_xecore_fuse_regs = 1,
};

#define XE_HP_FEATURES \
@@ -62,6 +63,8 @@ static const struct xe_graphics_desc graphics_xehpg = {
		BIT(XE_HW_ENGINE_RCS0) | BIT(XE_HW_ENGINE_BCS0) |
		BIT(XE_HW_ENGINE_CCS0) | BIT(XE_HW_ENGINE_CCS1) |
		BIT(XE_HW_ENGINE_CCS2) | BIT(XE_HW_ENGINE_CCS3),
	.num_geometry_xecore_fuse_regs = 1,
	.num_compute_xecore_fuse_regs = 1,

	XE_HP_FEATURES,
};
@@ -81,12 +84,15 @@ static const struct xe_graphics_desc graphics_xehpc = {
	.has_asid = 1,
	.has_atomic_enable_pte_bit = 1,
	.has_usm = 1,
	.num_compute_xecore_fuse_regs = 2,
};

static const struct xe_graphics_desc graphics_xelpg = {
	.hw_engine_mask =
		BIT(XE_HW_ENGINE_RCS0) | BIT(XE_HW_ENGINE_BCS0) |
		BIT(XE_HW_ENGINE_CCS0),
	.num_geometry_xecore_fuse_regs = 1,
	.num_compute_xecore_fuse_regs = 1,

	XE_HP_FEATURES,
};
@@ -104,6 +110,8 @@ static const struct xe_graphics_desc graphics_xelpg = {

static const struct xe_graphics_desc graphics_xe2 = {
	XE2_GFX_FEATURES,
	.num_geometry_xecore_fuse_regs = 3,
	.num_compute_xecore_fuse_regs = 3,
};

static const struct xe_graphics_desc graphics_xe3p_xpc = {
@@ -114,6 +122,8 @@ static const struct xe_graphics_desc graphics_xe3p_xpc = {
		GENMASK(XE_HW_ENGINE_CCS3, XE_HW_ENGINE_CCS0),
	.multi_queue_engine_class_mask = BIT(XE_ENGINE_CLASS_COPY) |
					 BIT(XE_ENGINE_CLASS_COMPUTE),
	.num_geometry_xecore_fuse_regs = 3,
	.num_compute_xecore_fuse_regs = 3,
};

static const struct xe_media_desc media_xem = {
@@ -782,6 +792,8 @@ static struct xe_gt *alloc_primary_gt(struct xe_tile *tile,
	gt->info.has_indirect_ring_state = graphics_desc->has_indirect_ring_state;
	gt->info.multi_queue_engine_class_mask = graphics_desc->multi_queue_engine_class_mask;
	gt->info.engine_mask = graphics_desc->hw_engine_mask;
	gt->info.num_geometry_xecore_fuse_regs = graphics_desc->num_geometry_xecore_fuse_regs;
	gt->info.num_compute_xecore_fuse_regs = graphics_desc->num_compute_xecore_fuse_regs;

	/*
	 * Before media version 13, the media IP was part of the primary GT
+2 −0
Original line number Diff line number Diff line
@@ -66,6 +66,8 @@ struct xe_device_desc {
struct xe_graphics_desc {
	u64 hw_engine_mask;	/* hardware engines provided by graphics IP */
	u16 multi_queue_engine_class_mask; /* bitmask of engine classes which support multi queue */
	u8 num_geometry_xecore_fuse_regs;
	u8 num_compute_xecore_fuse_regs;

	u8 has_asid:1;
	u8 has_atomic_enable_pte_bit:1;