Commit eca0b720 authored by Chris Wilson's avatar Chris Wilson

drm/i915: Do initial mocs configuration directly

Now that we record the default "goldenstate" context, we do not need to
emit the mocs registers at the start of each context and can simply do
mmio before the first context and capture the registers as part of its
default image. As a consequence, this means that we repeat the mmio
after each engine reset, fixing up any platform and registers that were
zapped by the reset (for those platforms with global not context-saved
settings).

Bugzilla: https://bugs.freedesktop.org/show_bug.cgi?id=111723
Bugzilla: https://bugs.freedesktop.org/show_bug.cgi?id=111645Signed-off-by: default avatarChris Wilson <chris@chris-wilson.co.uk>
Cc: Prathap Kumar Valsan <prathap.kumar.valsan@intel.com>
Reviewed-by: default avatarPrathap Kumar Valsan <prathap.kumar.valsan@intel.com>
Link: https://patchwork.freedesktop.org/patch/msgid/20191016090749.7092-1-chris@chris-wilson.co.uk
parent 5f65d5a6
...@@ -287,10 +287,9 @@ static const struct drm_i915_mocs_entry icelake_mocs_table[] = { ...@@ -287,10 +287,9 @@ static const struct drm_i915_mocs_entry icelake_mocs_table[] = {
GEN11_MOCS_ENTRIES GEN11_MOCS_ENTRIES
}; };
static bool get_mocs_settings(struct intel_gt *gt, static bool get_mocs_settings(const struct drm_i915_private *i915,
struct drm_i915_mocs_table *table) struct drm_i915_mocs_table *table)
{ {
struct drm_i915_private *i915 = gt->i915;
bool result = false; bool result = false;
if (INTEL_GEN(i915) >= 12) { if (INTEL_GEN(i915) >= 12) {
...@@ -331,9 +330,9 @@ static bool get_mocs_settings(struct intel_gt *gt, ...@@ -331,9 +330,9 @@ static bool get_mocs_settings(struct intel_gt *gt,
return result; return result;
} }
static i915_reg_t mocs_register(enum intel_engine_id engine_id, int index) static i915_reg_t mocs_register(const struct intel_engine_cs *engine, int index)
{ {
switch (engine_id) { switch (engine->id) {
case RCS0: case RCS0:
return GEN9_GFX_MOCS(index); return GEN9_GFX_MOCS(index);
case VCS0: case VCS0:
...@@ -347,7 +346,7 @@ static i915_reg_t mocs_register(enum intel_engine_id engine_id, int index) ...@@ -347,7 +346,7 @@ static i915_reg_t mocs_register(enum intel_engine_id engine_id, int index)
case VCS2: case VCS2:
return GEN11_MFX2_MOCS(index); return GEN11_MFX2_MOCS(index);
default: default:
MISSING_CASE(engine_id); MISSING_CASE(engine->id);
return INVALID_MMIO_REG; return INVALID_MMIO_REG;
} }
} }
...@@ -365,118 +364,25 @@ static u32 get_entry_control(const struct drm_i915_mocs_table *table, ...@@ -365,118 +364,25 @@ static u32 get_entry_control(const struct drm_i915_mocs_table *table,
return table->table[I915_MOCS_PTE].control_value; return table->table[I915_MOCS_PTE].control_value;
} }
/** static void init_mocs_table(struct intel_engine_cs *engine,
* intel_mocs_init_engine() - emit the mocs control table const struct drm_i915_mocs_table *table)
* @engine: The engine for whom to emit the registers.
*
* This function simply emits a MI_LOAD_REGISTER_IMM command for the
* given table starting at the given address.
*/
void intel_mocs_init_engine(struct intel_engine_cs *engine)
{ {
struct intel_gt *gt = engine->gt; struct intel_uncore *uncore = engine->uncore;
struct intel_uncore *uncore = gt->uncore; u32 unused_value = table->table[I915_MOCS_PTE].control_value;
struct drm_i915_mocs_table table; unsigned int i;
unsigned int index;
u32 unused_value;
/* Platforms with global MOCS do not need per-engine initialization. */
if (HAS_GLOBAL_MOCS_REGISTERS(gt->i915))
return;
/* Called under a blanket forcewake */
assert_forcewakes_active(uncore, FORCEWAKE_ALL);
if (!get_mocs_settings(gt, &table))
return;
/* Set unused values to PTE */
unused_value = table.table[I915_MOCS_PTE].control_value;
for (index = 0; index < table.size; index++) {
u32 value = get_entry_control(&table, index);
for (i = 0; i < table->size; i++)
intel_uncore_write_fw(uncore, intel_uncore_write_fw(uncore,
mocs_register(engine->id, index), mocs_register(engine, i),
value); get_entry_control(table, i));
}
/* All remaining entries are also unused */ /* All remaining entries are unused */
for (; index < table.n_entries; index++) for (; i < table->n_entries; i++)
intel_uncore_write_fw(uncore, intel_uncore_write_fw(uncore,
mocs_register(engine->id, index), mocs_register(engine, i),
unused_value); unused_value);
} }
static void intel_mocs_init_global(struct intel_gt *gt)
{
struct intel_uncore *uncore = gt->uncore;
struct drm_i915_mocs_table table;
unsigned int index;
GEM_BUG_ON(!HAS_GLOBAL_MOCS_REGISTERS(gt->i915));
if (!get_mocs_settings(gt, &table))
return;
if (GEM_DEBUG_WARN_ON(table.size > table.n_entries))
return;
for (index = 0; index < table.size; index++)
intel_uncore_write(uncore,
GEN12_GLOBAL_MOCS(index),
table.table[index].control_value);
/*
* Ok, now set the unused entries to the invalid entry (index 0). These
* entries are officially undefined and no contract for the contents and
* settings is given for these entries.
*/
for (; index < table.n_entries; index++)
intel_uncore_write(uncore,
GEN12_GLOBAL_MOCS(index),
table.table[0].control_value);
}
static int emit_mocs_control_table(struct i915_request *rq,
const struct drm_i915_mocs_table *table)
{
enum intel_engine_id engine = rq->engine->id;
unsigned int index;
u32 unused_value;
u32 *cs;
if (GEM_WARN_ON(table->size > table->n_entries))
return -ENODEV;
/* Set unused values to PTE */
unused_value = table->table[I915_MOCS_PTE].control_value;
cs = intel_ring_begin(rq, 2 + 2 * table->n_entries);
if (IS_ERR(cs))
return PTR_ERR(cs);
*cs++ = MI_LOAD_REGISTER_IMM(table->n_entries);
for (index = 0; index < table->size; index++) {
u32 value = get_entry_control(table, index);
*cs++ = i915_mmio_reg_offset(mocs_register(engine, index));
*cs++ = value;
}
/* All remaining entries are also unused */
for (; index < table->n_entries; index++) {
*cs++ = i915_mmio_reg_offset(mocs_register(engine, index));
*cs++ = unused_value;
}
*cs++ = MI_NOOP;
intel_ring_advance(rq, cs);
return 0;
}
/* /*
* Get l3cc_value from MOCS entry taking into account when it's not used: * Get l3cc_value from MOCS entry taking into account when it's not used:
* I915_MOCS_PTE's value is returned in this case. * I915_MOCS_PTE's value is returned in this case.
...@@ -494,141 +400,93 @@ static inline u32 l3cc_combine(const struct drm_i915_mocs_table *table, ...@@ -494,141 +400,93 @@ static inline u32 l3cc_combine(const struct drm_i915_mocs_table *table,
u16 low, u16 low,
u16 high) u16 high)
{ {
return low | high << 16; return low | (u32)high << 16;
} }
static int emit_mocs_l3cc_table(struct i915_request *rq, static void init_l3cc_table(struct intel_engine_cs *engine,
const struct drm_i915_mocs_table *table) const struct drm_i915_mocs_table *table)
{ {
u16 unused_value; struct intel_uncore *uncore = engine->uncore;
u16 unused_value = table->table[I915_MOCS_PTE].l3cc_value;
unsigned int i; unsigned int i;
u32 *cs;
if (GEM_WARN_ON(table->size > table->n_entries))
return -ENODEV;
/* Set unused values to PTE */
unused_value = table->table[I915_MOCS_PTE].l3cc_value;
cs = intel_ring_begin(rq, 2 + table->n_entries);
if (IS_ERR(cs))
return PTR_ERR(cs);
*cs++ = MI_LOAD_REGISTER_IMM(table->n_entries / 2);
for (i = 0; i < table->size / 2; i++) { for (i = 0; i < table->size / 2; i++) {
u16 low = get_entry_l3cc(table, 2 * i); u16 low = get_entry_l3cc(table, 2 * i);
u16 high = get_entry_l3cc(table, 2 * i + 1); u16 high = get_entry_l3cc(table, 2 * i + 1);
*cs++ = i915_mmio_reg_offset(GEN9_LNCFCMOCS(i)); intel_uncore_write(uncore,
*cs++ = l3cc_combine(table, low, high); GEN9_LNCFCMOCS(i),
l3cc_combine(table, low, high));
} }
/* Odd table size - 1 left over */ /* Odd table size - 1 left over */
if (table->size & 0x01) { if (table->size & 1) {
u16 low = get_entry_l3cc(table, 2 * i); u16 low = get_entry_l3cc(table, 2 * i);
*cs++ = i915_mmio_reg_offset(GEN9_LNCFCMOCS(i)); intel_uncore_write(uncore,
*cs++ = l3cc_combine(table, low, unused_value); GEN9_LNCFCMOCS(i),
l3cc_combine(table, low, unused_value));
i++; i++;
} }
/* All remaining entries are also unused */ /* All remaining entries are also unused */
for (; i < table->n_entries / 2; i++) { for (; i < table->n_entries / 2; i++)
*cs++ = i915_mmio_reg_offset(GEN9_LNCFCMOCS(i)); intel_uncore_write(uncore,
*cs++ = l3cc_combine(table, unused_value, unused_value); GEN9_LNCFCMOCS(i),
} l3cc_combine(table, unused_value,
unused_value));
*cs++ = MI_NOOP;
intel_ring_advance(rq, cs);
return 0;
} }
static void intel_mocs_init_l3cc_table(struct intel_gt *gt) void intel_mocs_init_engine(struct intel_engine_cs *engine)
{ {
struct intel_uncore *uncore = gt->uncore;
struct drm_i915_mocs_table table; struct drm_i915_mocs_table table;
unsigned int i;
u16 unused_value;
if (!get_mocs_settings(gt, &table)) /* Called under a blanket forcewake */
assert_forcewakes_active(engine->uncore, FORCEWAKE_ALL);
if (!get_mocs_settings(engine->i915, &table))
return; return;
/* Set unused values to PTE */ /* Platforms with global MOCS do not need per-engine initialization. */
unused_value = table.table[I915_MOCS_PTE].l3cc_value; if (!HAS_GLOBAL_MOCS_REGISTERS(engine->i915))
init_mocs_table(engine, &table);
for (i = 0; i < table.size / 2; i++) { if (engine->class == RENDER_CLASS)
u16 low = get_entry_l3cc(&table, 2 * i); init_l3cc_table(engine, &table);
u16 high = get_entry_l3cc(&table, 2 * i + 1); }
intel_uncore_write(uncore, static void intel_mocs_init_global(struct intel_gt *gt)
GEN9_LNCFCMOCS(i), {
l3cc_combine(&table, low, high)); struct intel_uncore *uncore = gt->uncore;
} struct drm_i915_mocs_table table;
unsigned int index;
/* Odd table size - 1 left over */ GEM_BUG_ON(!HAS_GLOBAL_MOCS_REGISTERS(gt->i915));
if (table.size & 0x01) {
u16 low = get_entry_l3cc(&table, 2 * i);
intel_uncore_write(uncore, if (!get_mocs_settings(gt->i915, &table))
GEN9_LNCFCMOCS(i), return;
l3cc_combine(&table, low, unused_value));
i++;
}
/* All remaining entries are also unused */ if (GEM_DEBUG_WARN_ON(table.size > table.n_entries))
for (; i < table.n_entries / 2; i++) return;
for (index = 0; index < table.size; index++)
intel_uncore_write(uncore, intel_uncore_write(uncore,
GEN9_LNCFCMOCS(i), GEN12_GLOBAL_MOCS(index),
l3cc_combine(&table, unused_value, table.table[index].control_value);
unused_value));
}
/** /*
* intel_mocs_emit() - program the MOCS register. * Ok, now set the unused entries to the invalid entry (index 0). These
* @rq: Request to use to set up the MOCS tables. * entries are officially undefined and no contract for the contents and
* * settings is given for these entries.
* This function will emit a batch buffer with the values required for
* programming the MOCS register values for all the currently supported
* rings.
*
* These registers are partially stored in the RCS context, so they are
* emitted at the same time so that when a context is created these registers
* are set up. These registers have to be emitted into the start of the
* context as setting the ELSP will re-init some of these registers back
* to the hw values.
*
* Return: 0 on success, otherwise the error status.
*/ */
int intel_mocs_emit(struct i915_request *rq) for (; index < table.n_entries; index++)
{ intel_uncore_write(uncore,
struct drm_i915_mocs_table t; GEN12_GLOBAL_MOCS(index),
int ret; table.table[0].control_value);
if (HAS_GLOBAL_MOCS_REGISTERS(rq->i915) ||
rq->engine->class != RENDER_CLASS)
return 0;
if (get_mocs_settings(rq->engine->gt, &t)) {
/* Program the RCS control registers */
ret = emit_mocs_control_table(rq, &t);
if (ret)
return ret;
/* Now program the l3cc registers */
ret = emit_mocs_l3cc_table(rq, &t);
if (ret)
return ret;
}
return 0;
} }
void intel_mocs_init(struct intel_gt *gt) void intel_mocs_init(struct intel_gt *gt)
{ {
intel_mocs_init_l3cc_table(gt);
if (HAS_GLOBAL_MOCS_REGISTERS(gt->i915)) if (HAS_GLOBAL_MOCS_REGISTERS(gt->i915))
intel_mocs_init_global(gt); intel_mocs_init_global(gt);
} }
...@@ -49,13 +49,10 @@ ...@@ -49,13 +49,10 @@
* context handling keep the MOCS in step. * context handling keep the MOCS in step.
*/ */
struct i915_request;
struct intel_engine_cs; struct intel_engine_cs;
struct intel_gt; struct intel_gt;
void intel_mocs_init(struct intel_gt *gt); void intel_mocs_init(struct intel_gt *gt);
void intel_mocs_init_engine(struct intel_engine_cs *engine); void intel_mocs_init_engine(struct intel_engine_cs *engine);
int intel_mocs_emit(struct i915_request *rq);
#endif #endif
...@@ -1111,15 +1111,6 @@ static int __intel_engines_record_defaults(struct drm_i915_private *i915) ...@@ -1111,15 +1111,6 @@ static int __intel_engines_record_defaults(struct drm_i915_private *i915)
if (err) if (err)
goto err_rq; goto err_rq;
/*
* Failing to program the MOCS is non-fatal.The system will not
* run at peak performance. So warn the user and carry on.
*/
err = intel_mocs_emit(rq);
if (err)
dev_notice(i915->drm.dev,
"Failed to program MOCS registers; expect performance issues.\n");
err = intel_renderstate_emit(rq); err = intel_renderstate_emit(rq);
if (err) if (err)
goto err_rq; goto err_rq;
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment