323 lines
10 KiB
C
323 lines
10 KiB
C
|
// SPDX-License-Identifier: MIT
|
||
|
/*
|
||
|
* Copyright © 2017-2019 Intel Corporation
|
||
|
*/
|
||
|
|
||
|
#include "intel_wopcm.h"
|
||
|
#include "i915_drv.h"
|
||
|
|
||
|
/**
|
||
|
* DOC: WOPCM Layout
|
||
|
*
|
||
|
* The layout of the WOPCM will be fixed after writing to GuC WOPCM size and
|
||
|
* offset registers whose values are calculated and determined by HuC/GuC
|
||
|
* firmware size and set of hardware requirements/restrictions as shown below:
|
||
|
*
|
||
|
* ::
|
||
|
*
|
||
|
* +=========> +====================+ <== WOPCM Top
|
||
|
* ^ | HW contexts RSVD |
|
||
|
* | +===> +====================+ <== GuC WOPCM Top
|
||
|
* | ^ | |
|
||
|
* | | | |
|
||
|
* | | | |
|
||
|
* | GuC | |
|
||
|
* | WOPCM | |
|
||
|
* | Size +--------------------+
|
||
|
* WOPCM | | GuC FW RSVD |
|
||
|
* | | +--------------------+
|
||
|
* | | | GuC Stack RSVD |
|
||
|
* | | +------------------- +
|
||
|
* | v | GuC WOPCM RSVD |
|
||
|
* | +===> +====================+ <== GuC WOPCM base
|
||
|
* | | WOPCM RSVD |
|
||
|
* | +------------------- + <== HuC Firmware Top
|
||
|
* v | HuC FW |
|
||
|
* +=========> +====================+ <== WOPCM Base
|
||
|
*
|
||
|
* GuC accessible WOPCM starts at GuC WOPCM base and ends at GuC WOPCM top.
|
||
|
* The top part of the WOPCM is reserved for hardware contexts (e.g. RC6
|
||
|
* context).
|
||
|
*/
|
||
|
|
||
|
/* Default WOPCM size is 2MB from Gen11, 1MB on previous platforms */
|
||
|
#define GEN11_WOPCM_SIZE SZ_2M
|
||
|
#define GEN9_WOPCM_SIZE SZ_1M
|
||
|
#define MAX_WOPCM_SIZE SZ_8M
|
||
|
/* 16KB WOPCM (RSVD WOPCM) is reserved from HuC firmware top. */
|
||
|
#define WOPCM_RESERVED_SIZE SZ_16K
|
||
|
|
||
|
/* 16KB reserved at the beginning of GuC WOPCM. */
|
||
|
#define GUC_WOPCM_RESERVED SZ_16K
|
||
|
/* 8KB from GUC_WOPCM_RESERVED is reserved for GuC stack. */
|
||
|
#define GUC_WOPCM_STACK_RESERVED SZ_8K
|
||
|
|
||
|
/* GuC WOPCM Offset value needs to be aligned to 16KB. */
|
||
|
#define GUC_WOPCM_OFFSET_ALIGNMENT (1UL << GUC_WOPCM_OFFSET_SHIFT)
|
||
|
|
||
|
/* 24KB at the end of WOPCM is reserved for RC6 CTX on BXT. */
|
||
|
#define BXT_WOPCM_RC6_CTX_RESERVED (SZ_16K + SZ_8K)
|
||
|
/* 36KB WOPCM reserved at the end of WOPCM on ICL. */
|
||
|
#define ICL_WOPCM_HW_CTX_RESERVED (SZ_32K + SZ_4K)
|
||
|
|
||
|
/* 128KB from GUC_WOPCM_RESERVED is reserved for FW on Gen9. */
|
||
|
#define GEN9_GUC_FW_RESERVED SZ_128K
|
||
|
#define GEN9_GUC_WOPCM_OFFSET (GUC_WOPCM_RESERVED + GEN9_GUC_FW_RESERVED)
|
||
|
|
||
|
static inline struct intel_gt *wopcm_to_gt(struct intel_wopcm *wopcm)
|
||
|
{
|
||
|
return container_of(wopcm, struct intel_gt, wopcm);
|
||
|
}
|
||
|
|
||
|
/**
|
||
|
* intel_wopcm_init_early() - Early initialization of the WOPCM.
|
||
|
* @wopcm: pointer to intel_wopcm.
|
||
|
*
|
||
|
* Setup the size of WOPCM which will be used by later on WOPCM partitioning.
|
||
|
*/
|
||
|
void intel_wopcm_init_early(struct intel_wopcm *wopcm)
|
||
|
{
|
||
|
struct intel_gt *gt = wopcm_to_gt(wopcm);
|
||
|
struct drm_i915_private *i915 = gt->i915;
|
||
|
|
||
|
if (!HAS_GT_UC(i915))
|
||
|
return;
|
||
|
|
||
|
if (GRAPHICS_VER(i915) >= 11)
|
||
|
wopcm->size = GEN11_WOPCM_SIZE;
|
||
|
else
|
||
|
wopcm->size = GEN9_WOPCM_SIZE;
|
||
|
|
||
|
drm_dbg(&i915->drm, "WOPCM: %uK\n", wopcm->size / 1024);
|
||
|
}
|
||
|
|
||
|
static u32 context_reserved_size(struct drm_i915_private *i915)
|
||
|
{
|
||
|
if (IS_GEN9_LP(i915))
|
||
|
return BXT_WOPCM_RC6_CTX_RESERVED;
|
||
|
else if (GRAPHICS_VER(i915) >= 11)
|
||
|
return ICL_WOPCM_HW_CTX_RESERVED;
|
||
|
else
|
||
|
return 0;
|
||
|
}
|
||
|
|
||
|
static bool gen9_check_dword_gap(struct drm_i915_private *i915,
|
||
|
u32 guc_wopcm_base, u32 guc_wopcm_size)
|
||
|
{
|
||
|
u32 offset;
|
||
|
|
||
|
/*
|
||
|
* GuC WOPCM size shall be at least a dword larger than the offset from
|
||
|
* WOPCM base (GuC WOPCM offset from WOPCM base + GEN9_GUC_WOPCM_OFFSET)
|
||
|
* due to hardware limitation on Gen9.
|
||
|
*/
|
||
|
offset = guc_wopcm_base + GEN9_GUC_WOPCM_OFFSET;
|
||
|
if (offset > guc_wopcm_size ||
|
||
|
(guc_wopcm_size - offset) < sizeof(u32)) {
|
||
|
drm_err(&i915->drm,
|
||
|
"WOPCM: invalid GuC region size: %uK < %uK\n",
|
||
|
guc_wopcm_size / SZ_1K,
|
||
|
(u32)(offset + sizeof(u32)) / SZ_1K);
|
||
|
return false;
|
||
|
}
|
||
|
|
||
|
return true;
|
||
|
}
|
||
|
|
||
|
static bool gen9_check_huc_fw_fits(struct drm_i915_private *i915,
|
||
|
u32 guc_wopcm_size, u32 huc_fw_size)
|
||
|
{
|
||
|
/*
|
||
|
* On Gen9, hardware requires the total available GuC WOPCM
|
||
|
* size to be larger than or equal to HuC firmware size. Otherwise,
|
||
|
* firmware uploading would fail.
|
||
|
*/
|
||
|
if (huc_fw_size > guc_wopcm_size - GUC_WOPCM_RESERVED) {
|
||
|
drm_err(&i915->drm, "WOPCM: no space for %s: %uK < %uK\n",
|
||
|
intel_uc_fw_type_repr(INTEL_UC_FW_TYPE_HUC),
|
||
|
(guc_wopcm_size - GUC_WOPCM_RESERVED) / SZ_1K,
|
||
|
huc_fw_size / 1024);
|
||
|
return false;
|
||
|
}
|
||
|
|
||
|
return true;
|
||
|
}
|
||
|
|
||
|
static bool check_hw_restrictions(struct drm_i915_private *i915,
|
||
|
u32 guc_wopcm_base, u32 guc_wopcm_size,
|
||
|
u32 huc_fw_size)
|
||
|
{
|
||
|
if (GRAPHICS_VER(i915) == 9 && !gen9_check_dword_gap(i915, guc_wopcm_base,
|
||
|
guc_wopcm_size))
|
||
|
return false;
|
||
|
|
||
|
if (GRAPHICS_VER(i915) == 9 &&
|
||
|
!gen9_check_huc_fw_fits(i915, guc_wopcm_size, huc_fw_size))
|
||
|
return false;
|
||
|
|
||
|
return true;
|
||
|
}
|
||
|
|
||
|
static bool __check_layout(struct intel_gt *gt, u32 wopcm_size,
|
||
|
u32 guc_wopcm_base, u32 guc_wopcm_size,
|
||
|
u32 guc_fw_size, u32 huc_fw_size)
|
||
|
{
|
||
|
struct drm_i915_private *i915 = gt->i915;
|
||
|
const u32 ctx_rsvd = context_reserved_size(i915);
|
||
|
u32 size;
|
||
|
|
||
|
size = wopcm_size - ctx_rsvd;
|
||
|
if (unlikely(range_overflows(guc_wopcm_base, guc_wopcm_size, size))) {
|
||
|
drm_err(&i915->drm,
|
||
|
"WOPCM: invalid GuC region layout: %uK + %uK > %uK\n",
|
||
|
guc_wopcm_base / SZ_1K, guc_wopcm_size / SZ_1K,
|
||
|
size / SZ_1K);
|
||
|
return false;
|
||
|
}
|
||
|
|
||
|
size = guc_fw_size + GUC_WOPCM_RESERVED + GUC_WOPCM_STACK_RESERVED;
|
||
|
if (unlikely(guc_wopcm_size < size)) {
|
||
|
drm_err(&i915->drm, "WOPCM: no space for %s: %uK < %uK\n",
|
||
|
intel_uc_fw_type_repr(INTEL_UC_FW_TYPE_GUC),
|
||
|
guc_wopcm_size / SZ_1K, size / SZ_1K);
|
||
|
return false;
|
||
|
}
|
||
|
|
||
|
if (intel_uc_supports_huc(>->uc)) {
|
||
|
size = huc_fw_size + WOPCM_RESERVED_SIZE;
|
||
|
if (unlikely(guc_wopcm_base < size)) {
|
||
|
drm_err(&i915->drm, "WOPCM: no space for %s: %uK < %uK\n",
|
||
|
intel_uc_fw_type_repr(INTEL_UC_FW_TYPE_HUC),
|
||
|
guc_wopcm_base / SZ_1K, size / SZ_1K);
|
||
|
return false;
|
||
|
}
|
||
|
}
|
||
|
|
||
|
return check_hw_restrictions(i915, guc_wopcm_base, guc_wopcm_size,
|
||
|
huc_fw_size);
|
||
|
}
|
||
|
|
||
|
static bool __wopcm_regs_locked(struct intel_uncore *uncore,
|
||
|
u32 *guc_wopcm_base, u32 *guc_wopcm_size)
|
||
|
{
|
||
|
u32 reg_base = intel_uncore_read(uncore, DMA_GUC_WOPCM_OFFSET);
|
||
|
u32 reg_size = intel_uncore_read(uncore, GUC_WOPCM_SIZE);
|
||
|
|
||
|
if (!(reg_size & GUC_WOPCM_SIZE_LOCKED) ||
|
||
|
!(reg_base & GUC_WOPCM_OFFSET_VALID))
|
||
|
return false;
|
||
|
|
||
|
*guc_wopcm_base = reg_base & GUC_WOPCM_OFFSET_MASK;
|
||
|
*guc_wopcm_size = reg_size & GUC_WOPCM_SIZE_MASK;
|
||
|
return true;
|
||
|
}
|
||
|
|
||
|
static bool __wopcm_regs_writable(struct intel_uncore *uncore)
|
||
|
{
|
||
|
if (!HAS_GUC_DEPRIVILEGE(uncore->i915))
|
||
|
return true;
|
||
|
|
||
|
return intel_uncore_read(uncore, GUC_SHIM_CONTROL2) & GUC_IS_PRIVILEGED;
|
||
|
}
|
||
|
|
||
|
/**
|
||
|
* intel_wopcm_init() - Initialize the WOPCM structure.
|
||
|
* @wopcm: pointer to intel_wopcm.
|
||
|
*
|
||
|
* This function will partition WOPCM space based on GuC and HuC firmware sizes
|
||
|
* and will allocate max remaining for use by GuC. This function will also
|
||
|
* enforce platform dependent hardware restrictions on GuC WOPCM offset and
|
||
|
* size. It will fail the WOPCM init if any of these checks fail, so that the
|
||
|
* following WOPCM registers setup and GuC firmware uploading would be aborted.
|
||
|
*/
|
||
|
void intel_wopcm_init(struct intel_wopcm *wopcm)
|
||
|
{
|
||
|
struct intel_gt *gt = wopcm_to_gt(wopcm);
|
||
|
struct drm_i915_private *i915 = gt->i915;
|
||
|
u32 guc_fw_size = intel_uc_fw_get_upload_size(>->uc.guc.fw);
|
||
|
u32 huc_fw_size = intel_uc_fw_get_upload_size(>->uc.huc.fw);
|
||
|
u32 ctx_rsvd = context_reserved_size(i915);
|
||
|
u32 wopcm_size = wopcm->size;
|
||
|
u32 guc_wopcm_base;
|
||
|
u32 guc_wopcm_size;
|
||
|
|
||
|
if (!guc_fw_size)
|
||
|
return;
|
||
|
|
||
|
GEM_BUG_ON(!wopcm_size);
|
||
|
GEM_BUG_ON(wopcm->guc.base);
|
||
|
GEM_BUG_ON(wopcm->guc.size);
|
||
|
GEM_BUG_ON(guc_fw_size >= wopcm_size);
|
||
|
GEM_BUG_ON(huc_fw_size >= wopcm_size);
|
||
|
GEM_BUG_ON(ctx_rsvd + WOPCM_RESERVED_SIZE >= wopcm_size);
|
||
|
|
||
|
if (i915_inject_probe_failure(i915))
|
||
|
return;
|
||
|
|
||
|
if (__wopcm_regs_locked(gt->uncore, &guc_wopcm_base, &guc_wopcm_size)) {
|
||
|
drm_dbg(&i915->drm, "GuC WOPCM is already locked [%uK, %uK)\n",
|
||
|
guc_wopcm_base / SZ_1K, guc_wopcm_size / SZ_1K);
|
||
|
/*
|
||
|
* Note that to keep things simple (i.e. avoid different
|
||
|
* defines per platform) our WOPCM math doesn't always use the
|
||
|
* actual WOPCM size, but a value that is less or equal to it.
|
||
|
* This is perfectly fine when i915 programs the registers, but
|
||
|
* on platforms with GuC deprivilege the registers are not
|
||
|
* writable from i915 and are instead pre-programmed by the
|
||
|
* bios/IFWI, so there might be a mismatch of sizes.
|
||
|
* Instead of handling the size difference, we trust that the
|
||
|
* programmed values make sense and disable the relevant check
|
||
|
* by using the maximum possible WOPCM size in the verification
|
||
|
* math. In the extremely unlikely case that the registers
|
||
|
* were pre-programmed with an invalid value, we will still
|
||
|
* gracefully fail later during the GuC/HuC dma.
|
||
|
*/
|
||
|
if (!__wopcm_regs_writable(gt->uncore))
|
||
|
wopcm_size = MAX_WOPCM_SIZE;
|
||
|
|
||
|
goto check;
|
||
|
}
|
||
|
|
||
|
/*
|
||
|
* On platforms with a media GT, the WOPCM is partitioned between the
|
||
|
* two GTs, so we would have to take that into account when doing the
|
||
|
* math below. There is also a new section reserved for the GSC context
|
||
|
* that would have to be factored in. However, all platforms with a
|
||
|
* media GT also have GuC depriv enabled, so the WOPCM regs are
|
||
|
* pre-locked and therefore we don't have to do the math ourselves.
|
||
|
*/
|
||
|
if (unlikely(i915->media_gt)) {
|
||
|
drm_err(&i915->drm, "Unlocked WOPCM regs with media GT\n");
|
||
|
return;
|
||
|
}
|
||
|
|
||
|
/*
|
||
|
* Aligned value of guc_wopcm_base will determine available WOPCM space
|
||
|
* for HuC firmware and mandatory reserved area.
|
||
|
*/
|
||
|
guc_wopcm_base = huc_fw_size + WOPCM_RESERVED_SIZE;
|
||
|
guc_wopcm_base = ALIGN(guc_wopcm_base, GUC_WOPCM_OFFSET_ALIGNMENT);
|
||
|
|
||
|
/*
|
||
|
* Need to clamp guc_wopcm_base now to make sure the following math is
|
||
|
* correct. Formal check of whole WOPCM layout will be done below.
|
||
|
*/
|
||
|
guc_wopcm_base = min(guc_wopcm_base, wopcm_size - ctx_rsvd);
|
||
|
|
||
|
/* Aligned remainings of usable WOPCM space can be assigned to GuC. */
|
||
|
guc_wopcm_size = wopcm_size - ctx_rsvd - guc_wopcm_base;
|
||
|
guc_wopcm_size &= GUC_WOPCM_SIZE_MASK;
|
||
|
|
||
|
drm_dbg(&i915->drm, "Calculated GuC WOPCM [%uK, %uK)\n",
|
||
|
guc_wopcm_base / SZ_1K, guc_wopcm_size / SZ_1K);
|
||
|
|
||
|
check:
|
||
|
if (__check_layout(gt, wopcm_size, guc_wopcm_base, guc_wopcm_size,
|
||
|
guc_fw_size, huc_fw_size)) {
|
||
|
wopcm->guc.base = guc_wopcm_base;
|
||
|
wopcm->guc.size = guc_wopcm_size;
|
||
|
GEM_BUG_ON(!wopcm->guc.base);
|
||
|
GEM_BUG_ON(!wopcm->guc.size);
|
||
|
}
|
||
|
}
|