diff options
| author | Dmitry Torokhov <[email protected]> | 2023-08-30 16:06:38 -0700 | 
|---|---|---|
| committer | Dmitry Torokhov <[email protected]> | 2023-08-30 16:06:38 -0700 | 
| commit | 1ac731c529cd4d6adbce134754b51ff7d822b145 (patch) | |
| tree | 143ab3f35ca5f3b69f583c84e6964b17139c2ec1 /drivers/gpu/drm/i915/gt/intel_gt.c | |
| parent | 07b4c950f27bef0362dc6ad7ee713aab61d58149 (diff) | |
| parent | 54116d442e001e1b6bd482122043b1870998a1f3 (diff) | |
Merge branch 'next' into for-linus
Prepare input updates for 6.6 merge window.
Diffstat (limited to 'drivers/gpu/drm/i915/gt/intel_gt.c')
| -rw-r--r-- | drivers/gpu/drm/i915/gt/intel_gt.c | 170 | 
1 files changed, 51 insertions, 119 deletions
diff --git a/drivers/gpu/drm/i915/gt/intel_gt.c b/drivers/gpu/drm/i915/gt/intel_gt.c index f0dbfc434e07..7a008e829d4d 100644 --- a/drivers/gpu/drm/i915/gt/intel_gt.c +++ b/drivers/gpu/drm/i915/gt/intel_gt.c @@ -28,7 +28,6 @@  #include "intel_migrate.h"  #include "intel_mocs.h"  #include "intel_pci_config.h" -#include "intel_pm.h"  #include "intel_rc6.h"  #include "intel_renderstate.h"  #include "intel_rps.h" @@ -737,12 +736,12 @@ int intel_gt_init(struct intel_gt *gt)  	if (err)  		goto err_gt; -	intel_uc_init_late(>->uc); -  	err = i915_inject_probe_error(gt->i915, -EIO);  	if (err)  		goto err_gt; +	intel_uc_init_late(>->uc); +  	intel_migrate_init(>->migrate, gt);  	goto out_fw; @@ -785,6 +784,29 @@ void intel_gt_driver_unregister(struct intel_gt *gt)  	intel_gsc_fini(>->gsc);  	/* +	 * If we unload the driver and wedge before the GSC worker is complete, +	 * the worker will hit an error on its submission to the GSC engine and +	 * then exit. This is hard to hit for a user, but it is reproducible +	 * with skipping selftests. The error is handled gracefully by the +	 * worker, so there are no functional issues, but we still end up with +	 * an error message in dmesg, which is something we want to avoid as +	 * this is a supported scenario. We could modify the worker to better +	 * handle a wedging occurring during its execution, but that gets +	 * complicated for a couple of reasons: +	 * - We do want the error on runtime wedging, because there are +	 *   implications for subsystems outside of GT (i.e., PXP, HDCP), it's +	 *   only the error on driver unload that we want to silence. +	 * - The worker is responsible for multiple submissions (GSC FW load, +	 *   HuC auth, SW proxy), so all of those will have to be adapted to +	 *   handle the wedged_on_fini scenario. +	 * Therefore, it's much simpler to just wait for the worker to be done +	 * before wedging on driver removal, also considering that the worker +	 * will likely already be idle in the great majority of non-selftest +	 * scenarios. +	 */ +	intel_gsc_uc_flush_work(>->uc.gsc); + +	/*  	 * Upon unregistering the device to prevent any new users, cancel  	 * all in-flight requests so that we can quickly unbind the active  	 * resources. @@ -982,35 +1004,6 @@ void intel_gt_info_print(const struct intel_gt_info *info,  	intel_sseu_dump(&info->sseu, p);  } -struct reg_and_bit { -	union { -		i915_reg_t reg; -		i915_mcr_reg_t mcr_reg; -	}; -	u32 bit; -}; - -static struct reg_and_bit -get_reg_and_bit(const struct intel_engine_cs *engine, const bool gen8, -		const i915_reg_t *regs, const unsigned int num) -{ -	const unsigned int class = engine->class; -	struct reg_and_bit rb = { }; - -	if (gt_WARN_ON_ONCE(engine->gt, class >= num || !regs[class].reg)) -		return rb; - -	rb.reg = regs[class]; -	if (gen8 && class == VIDEO_DECODE_CLASS) -		rb.reg.reg += 4 * engine->instance; /* GEN8_M2TCR */ -	else -		rb.bit = engine->instance; - -	rb.bit = BIT(rb.bit); - -	return rb; -} -  /*   * HW architecture suggest typical invalidation time at 40us,   * with pessimistic cases up to 100us and a recommendation to @@ -1024,14 +1017,20 @@ get_reg_and_bit(const struct intel_engine_cs *engine, const bool gen8,   * but are now considered MCR registers.  Since they exist within a GAM range,   * the primary instance of the register rolls up the status from each unit.   */ -static int wait_for_invalidate(struct intel_gt *gt, struct reg_and_bit rb) +static int wait_for_invalidate(struct intel_engine_cs *engine)  { -	if (GRAPHICS_VER_FULL(gt->i915) >= IP_VER(12, 50)) -		return intel_gt_mcr_wait_for_reg(gt, rb.mcr_reg, rb.bit, 0, +	if (engine->tlb_inv.mcr) +		return intel_gt_mcr_wait_for_reg(engine->gt, +						 engine->tlb_inv.reg.mcr_reg, +						 engine->tlb_inv.done, +						 0,  						 TLB_INVAL_TIMEOUT_US,  						 TLB_INVAL_TIMEOUT_MS);  	else -		return __intel_wait_for_register_fw(gt->uncore, rb.reg, rb.bit, 0, +		return __intel_wait_for_register_fw(engine->gt->uncore, +						    engine->tlb_inv.reg.reg, +						    engine->tlb_inv.done, +						    0,  						    TLB_INVAL_TIMEOUT_US,  						    TLB_INVAL_TIMEOUT_MS,  						    NULL); @@ -1039,62 +1038,14 @@ static int wait_for_invalidate(struct intel_gt *gt, struct reg_and_bit rb)  static void mmio_invalidate_full(struct intel_gt *gt)  { -	static const i915_reg_t gen8_regs[] = { -		[RENDER_CLASS]			= GEN8_RTCR, -		[VIDEO_DECODE_CLASS]		= GEN8_M1TCR, /* , GEN8_M2TCR */ -		[VIDEO_ENHANCEMENT_CLASS]	= GEN8_VTCR, -		[COPY_ENGINE_CLASS]		= GEN8_BTCR, -	}; -	static const i915_reg_t gen12_regs[] = { -		[RENDER_CLASS]			= GEN12_GFX_TLB_INV_CR, -		[VIDEO_DECODE_CLASS]		= GEN12_VD_TLB_INV_CR, -		[VIDEO_ENHANCEMENT_CLASS]	= GEN12_VE_TLB_INV_CR, -		[COPY_ENGINE_CLASS]		= GEN12_BLT_TLB_INV_CR, -		[COMPUTE_CLASS]			= GEN12_COMPCTX_TLB_INV_CR, -	}; -	static const i915_mcr_reg_t xehp_regs[] = { -		[RENDER_CLASS]			= XEHP_GFX_TLB_INV_CR, -		[VIDEO_DECODE_CLASS]		= XEHP_VD_TLB_INV_CR, -		[VIDEO_ENHANCEMENT_CLASS]	= XEHP_VE_TLB_INV_CR, -		[COPY_ENGINE_CLASS]		= XEHP_BLT_TLB_INV_CR, -		[COMPUTE_CLASS]			= XEHP_COMPCTX_TLB_INV_CR, -	};  	struct drm_i915_private *i915 = gt->i915;  	struct intel_uncore *uncore = gt->uncore;  	struct intel_engine_cs *engine;  	intel_engine_mask_t awake, tmp;  	enum intel_engine_id id; -	const i915_reg_t *regs; -	unsigned int num = 0;  	unsigned long flags; -	/* -	 * New platforms should not be added with catch-all-newer (>=) -	 * condition so that any later platform added triggers the below warning -	 * and in turn mandates a human cross-check of whether the invalidation -	 * flows have compatible semantics. -	 * -	 * For instance with the 11.00 -> 12.00 transition three out of five -	 * respective engine registers were moved to masked type. Then after the -	 * 12.00 -> 12.50 transition multi cast handling is required too. -	 */ - -	if (GRAPHICS_VER_FULL(i915) == IP_VER(12, 50) || -	    GRAPHICS_VER_FULL(i915) == IP_VER(12, 55)) { -		regs = NULL; -		num = ARRAY_SIZE(xehp_regs); -	} else if (GRAPHICS_VER_FULL(i915) == IP_VER(12, 0) || -		   GRAPHICS_VER_FULL(i915) == IP_VER(12, 10)) { -		regs = gen12_regs; -		num = ARRAY_SIZE(gen12_regs); -	} else if (GRAPHICS_VER(i915) >= 8 && GRAPHICS_VER(i915) <= 11) { -		regs = gen8_regs; -		num = ARRAY_SIZE(gen8_regs); -	} else if (GRAPHICS_VER(i915) < 8) { -		return; -	} - -	if (gt_WARN_ONCE(gt, !num, "Platform does not implement TLB invalidation!")) +	if (GRAPHICS_VER(i915) < 8)  		return;  	intel_uncore_forcewake_get(uncore, FORCEWAKE_ALL); @@ -1104,33 +1055,18 @@ static void mmio_invalidate_full(struct intel_gt *gt)  	awake = 0;  	for_each_engine(engine, gt, id) { -		struct reg_and_bit rb; -  		if (!intel_engine_pm_is_awake(engine))  			continue; -		if (GRAPHICS_VER_FULL(i915) >= IP_VER(12, 50)) { -			u32 val = BIT(engine->instance); - -			if (engine->class == VIDEO_DECODE_CLASS || -			    engine->class == VIDEO_ENHANCEMENT_CLASS || -			    engine->class == COMPUTE_CLASS) -				val = _MASKED_BIT_ENABLE(val); +		if (engine->tlb_inv.mcr)  			intel_gt_mcr_multicast_write_fw(gt, -							xehp_regs[engine->class], -							val); -		} else { -			rb = get_reg_and_bit(engine, regs == gen8_regs, regs, num); -			if (!i915_mmio_reg_offset(rb.reg)) -				continue; - -			if (GRAPHICS_VER(i915) == 12 && (engine->class == VIDEO_DECODE_CLASS || -			    engine->class == VIDEO_ENHANCEMENT_CLASS || -			    engine->class == COMPUTE_CLASS)) -				rb.bit = _MASKED_BIT_ENABLE(rb.bit); - -			intel_uncore_write_fw(uncore, rb.reg, rb.bit); -		} +							engine->tlb_inv.reg.mcr_reg, +							engine->tlb_inv.request); +		else +			intel_uncore_write_fw(uncore, +					      engine->tlb_inv.reg.reg, +					      engine->tlb_inv.request); +  		awake |= engine->mask;  	} @@ -1149,17 +1085,9 @@ static void mmio_invalidate_full(struct intel_gt *gt)  	intel_gt_mcr_unlock(gt, flags);  	for_each_engine_masked(engine, gt, awake, tmp) { -		struct reg_and_bit rb; - -		if (GRAPHICS_VER_FULL(i915) >= IP_VER(12, 50)) { -			rb.mcr_reg = xehp_regs[engine->class]; -			rb.bit = BIT(engine->instance); -		} else { -			rb = get_reg_and_bit(engine, regs == gen8_regs, regs, num); -		} - -		if (wait_for_invalidate(gt, rb)) -			gt_err_ratelimited(gt, "%s TLB invalidation did not complete in %ums!\n", +		if (wait_for_invalidate(engine)) +			gt_err_ratelimited(gt, +					   "%s TLB invalidation did not complete in %ums!\n",  					   engine->name, TLB_INVAL_TIMEOUT_MS);  	} @@ -1205,3 +1133,7 @@ unlock:  		mutex_unlock(>->tlb.invalidate_lock);  	}  } + +#if IS_ENABLED(CONFIG_DRM_I915_SELFTEST) +#include "selftest_tlb.c" +#endif  |