| // SPDX-License-Identifier: MIT |
| /* |
| * Copyright © 2019 Intel Corporation |
| */ |
| |
| #include "intel_context.h" |
| #include "intel_engine_pm.h" |
| #include "intel_gpu_commands.h" |
| #include "intel_gt_requests.h" |
| #include "intel_ring.h" |
| #include "selftest_rc6.h" |
| |
| #include "selftests/i915_random.h" |
| #include "selftests/librapl.h" |
| |
| static u64 rc6_residency(struct intel_rc6 *rc6) |
| { |
| u64 result; |
| |
| /* XXX VLV_GT_MEDIA_RC6? */ |
| |
| result = intel_rc6_residency_ns(rc6, INTEL_RC6_RES_RC6); |
| if (HAS_RC6p(rc6_to_i915(rc6))) |
| result += intel_rc6_residency_ns(rc6, INTEL_RC6_RES_RC6p); |
| if (HAS_RC6pp(rc6_to_i915(rc6))) |
| result += intel_rc6_residency_ns(rc6, INTEL_RC6_RES_RC6pp); |
| |
| return result; |
| } |
| |
| int live_rc6_manual(void *arg) |
| { |
| struct intel_gt *gt = arg; |
| struct intel_rc6 *rc6 = >->rc6; |
| u64 rc0_power, rc6_power; |
| intel_wakeref_t wakeref; |
| bool has_power; |
| ktime_t dt; |
| u64 res[2]; |
| int err = 0; |
| |
| /* |
| * Our claim is that we can "encourage" the GPU to enter rc6 at will. |
| * Let's try it! |
| */ |
| |
| if (!rc6->enabled) |
| return 0; |
| |
| /* bsw/byt use a PCU and decouple RC6 from our manual control */ |
| if (IS_VALLEYVIEW(gt->i915) || IS_CHERRYVIEW(gt->i915)) |
| return 0; |
| |
| has_power = librapl_supported(gt->i915); |
| wakeref = intel_runtime_pm_get(gt->uncore->rpm); |
| |
| /* Force RC6 off for starters */ |
| __intel_rc6_disable(rc6); |
| msleep(1); /* wakeup is not immediate, takes about 100us on icl */ |
| |
| res[0] = rc6_residency(rc6); |
| |
| dt = ktime_get(); |
| rc0_power = librapl_energy_uJ(); |
| msleep(1000); |
| rc0_power = librapl_energy_uJ() - rc0_power; |
| dt = ktime_sub(ktime_get(), dt); |
| res[1] = rc6_residency(rc6); |
| if ((res[1] - res[0]) >> 10) { |
| pr_err("RC6 residency increased by %lldus while disabled for 1000ms!\n", |
| (res[1] - res[0]) >> 10); |
| err = -EINVAL; |
| goto out_unlock; |
| } |
| |
| if (has_power) { |
| rc0_power = div64_u64(NSEC_PER_SEC * rc0_power, |
| ktime_to_ns(dt)); |
| if (!rc0_power) { |
| pr_err("No power measured while in RC0\n"); |
| err = -EINVAL; |
| goto out_unlock; |
| } |
| } |
| |
| /* Manually enter RC6 */ |
| intel_rc6_park(rc6); |
| |
| res[0] = rc6_residency(rc6); |
| intel_uncore_forcewake_flush(rc6_to_uncore(rc6), FORCEWAKE_ALL); |
| dt = ktime_get(); |
| rc6_power = librapl_energy_uJ(); |
| msleep(100); |
| rc6_power = librapl_energy_uJ() - rc6_power; |
| dt = ktime_sub(ktime_get(), dt); |
| res[1] = rc6_residency(rc6); |
| if (res[1] == res[0]) { |
| pr_err("Did not enter RC6! RC6_STATE=%08x, RC6_CONTROL=%08x, residency=%lld\n", |
| intel_uncore_read_fw(gt->uncore, GEN6_RC_STATE), |
| intel_uncore_read_fw(gt->uncore, GEN6_RC_CONTROL), |
| res[0]); |
| err = -EINVAL; |
| } |
| |
| if (has_power) { |
| rc6_power = div64_u64(NSEC_PER_SEC * rc6_power, |
| ktime_to_ns(dt)); |
| pr_info("GPU consumed %llduW in RC0 and %llduW in RC6\n", |
| rc0_power, rc6_power); |
| if (2 * rc6_power > rc0_power) { |
| pr_err("GPU leaked energy while in RC6!\n"); |
| err = -EINVAL; |
| goto out_unlock; |
| } |
| } |
| |
| /* Restore what should have been the original state! */ |
| intel_rc6_unpark(rc6); |
| |
| out_unlock: |
| intel_runtime_pm_put(gt->uncore->rpm, wakeref); |
| return err; |
| } |
| |
| static const u32 *__live_rc6_ctx(struct intel_context *ce) |
| { |
| struct i915_request *rq; |
| const u32 *result; |
| u32 cmd; |
| u32 *cs; |
| |
| rq = intel_context_create_request(ce); |
| if (IS_ERR(rq)) |
| return ERR_CAST(rq); |
| |
| cs = intel_ring_begin(rq, 4); |
| if (IS_ERR(cs)) { |
| i915_request_add(rq); |
| return cs; |
| } |
| |
| cmd = MI_STORE_REGISTER_MEM | MI_USE_GGTT; |
| if (GRAPHICS_VER(rq->i915) >= 8) |
| cmd++; |
| |
| *cs++ = cmd; |
| *cs++ = i915_mmio_reg_offset(GEN8_RC6_CTX_INFO); |
| *cs++ = ce->timeline->hwsp_offset + 8; |
| *cs++ = 0; |
| intel_ring_advance(rq, cs); |
| |
| result = rq->hwsp_seqno + 2; |
| i915_request_add(rq); |
| |
| return result; |
| } |
| |
| static struct intel_engine_cs ** |
| randomised_engines(struct intel_gt *gt, |
| struct rnd_state *prng, |
| unsigned int *count) |
| { |
| struct intel_engine_cs *engine, **engines; |
| enum intel_engine_id id; |
| int n; |
| |
| n = 0; |
| for_each_engine(engine, gt, id) |
| n++; |
| if (!n) |
| return NULL; |
| |
| engines = kmalloc_array(n, sizeof(*engines), GFP_KERNEL); |
| if (!engines) |
| return NULL; |
| |
| n = 0; |
| for_each_engine(engine, gt, id) |
| engines[n++] = engine; |
| |
| i915_prandom_shuffle(engines, sizeof(*engines), n, prng); |
| |
| *count = n; |
| return engines; |
| } |
| |
| int live_rc6_ctx_wa(void *arg) |
| { |
| struct intel_gt *gt = arg; |
| struct intel_engine_cs **engines; |
| unsigned int n, count; |
| I915_RND_STATE(prng); |
| int err = 0; |
| |
| /* A read of CTX_INFO upsets rc6. Poke the bear! */ |
| if (GRAPHICS_VER(gt->i915) < 8) |
| return 0; |
| |
| engines = randomised_engines(gt, &prng, &count); |
| if (!engines) |
| return 0; |
| |
| for (n = 0; n < count; n++) { |
| struct intel_engine_cs *engine = engines[n]; |
| int pass; |
| |
| for (pass = 0; pass < 2; pass++) { |
| struct i915_gpu_error *error = >->i915->gpu_error; |
| struct intel_context *ce; |
| unsigned int resets = |
| i915_reset_engine_count(error, engine); |
| const u32 *res; |
| |
| /* Use a sacrifical context */ |
| ce = intel_context_create(engine); |
| if (IS_ERR(ce)) { |
| err = PTR_ERR(ce); |
| goto out; |
| } |
| |
| intel_engine_pm_get(engine); |
| res = __live_rc6_ctx(ce); |
| intel_engine_pm_put(engine); |
| intel_context_put(ce); |
| if (IS_ERR(res)) { |
| err = PTR_ERR(res); |
| goto out; |
| } |
| |
| if (intel_gt_wait_for_idle(gt, HZ / 5) == -ETIME) { |
| intel_gt_set_wedged(gt); |
| err = -ETIME; |
| goto out; |
| } |
| |
| intel_gt_pm_wait_for_idle(gt); |
| pr_debug("%s: CTX_INFO=%0x\n", |
| engine->name, READ_ONCE(*res)); |
| |
| if (resets != |
| i915_reset_engine_count(error, engine)) { |
| pr_err("%s: GPU reset required\n", |
| engine->name); |
| add_taint_for_CI(gt->i915, TAINT_WARN); |
| err = -EIO; |
| goto out; |
| } |
| } |
| } |
| |
| out: |
| kfree(engines); |
| return err; |
| } |