1b46a33e2STvrtko Ursulin /* 2b46a33e2STvrtko Ursulin * Copyright © 2017 Intel Corporation 3b46a33e2STvrtko Ursulin * 4b46a33e2STvrtko Ursulin * Permission is hereby granted, free of charge, to any person obtaining a 5b46a33e2STvrtko Ursulin * copy of this software and associated documentation files (the "Software"), 6b46a33e2STvrtko Ursulin * to deal in the Software without restriction, including without limitation 7b46a33e2STvrtko Ursulin * the rights to use, copy, modify, merge, publish, distribute, sublicense, 8b46a33e2STvrtko Ursulin * and/or sell copies of the Software, and to permit persons to whom the 9b46a33e2STvrtko Ursulin * Software is furnished to do so, subject to the following conditions: 10b46a33e2STvrtko Ursulin * 11b46a33e2STvrtko Ursulin * The above copyright notice and this permission notice (including the next 12b46a33e2STvrtko Ursulin * paragraph) shall be included in all copies or substantial portions of the 13b46a33e2STvrtko Ursulin * Software. 14b46a33e2STvrtko Ursulin * 15b46a33e2STvrtko Ursulin * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 16b46a33e2STvrtko Ursulin * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 17b46a33e2STvrtko Ursulin * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL 18b46a33e2STvrtko Ursulin * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER 19b46a33e2STvrtko Ursulin * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING 20b46a33e2STvrtko Ursulin * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS 21b46a33e2STvrtko Ursulin * IN THE SOFTWARE. 22b46a33e2STvrtko Ursulin * 23b46a33e2STvrtko Ursulin */ 24b46a33e2STvrtko Ursulin 25b46a33e2STvrtko Ursulin #include <linux/perf_event.h> 26b46a33e2STvrtko Ursulin #include <linux/pm_runtime.h> 27b46a33e2STvrtko Ursulin 28b46a33e2STvrtko Ursulin #include "i915_drv.h" 29b46a33e2STvrtko Ursulin #include "i915_pmu.h" 30b46a33e2STvrtko Ursulin #include "intel_ringbuffer.h" 31b46a33e2STvrtko Ursulin 32b46a33e2STvrtko Ursulin /* Frequency for the sampling timer for events which need it. */ 33b46a33e2STvrtko Ursulin #define FREQUENCY 200 34b46a33e2STvrtko Ursulin #define PERIOD max_t(u64, 10000, NSEC_PER_SEC / FREQUENCY) 35b46a33e2STvrtko Ursulin 36b46a33e2STvrtko Ursulin #define ENGINE_SAMPLE_MASK \ 37b46a33e2STvrtko Ursulin (BIT(I915_SAMPLE_BUSY) | \ 38b46a33e2STvrtko Ursulin BIT(I915_SAMPLE_WAIT) | \ 39b46a33e2STvrtko Ursulin BIT(I915_SAMPLE_SEMA)) 40b46a33e2STvrtko Ursulin 41b46a33e2STvrtko Ursulin #define ENGINE_SAMPLE_BITS (1 << I915_PMU_SAMPLE_BITS) 42b46a33e2STvrtko Ursulin 43141a0895SChris Wilson static cpumask_t i915_pmu_cpumask; 44b46a33e2STvrtko Ursulin 45b46a33e2STvrtko Ursulin static u8 engine_config_sample(u64 config) 46b46a33e2STvrtko Ursulin { 47b46a33e2STvrtko Ursulin return config & I915_PMU_SAMPLE_MASK; 48b46a33e2STvrtko Ursulin } 49b46a33e2STvrtko Ursulin 50b46a33e2STvrtko Ursulin static u8 engine_event_sample(struct perf_event *event) 51b46a33e2STvrtko Ursulin { 52b46a33e2STvrtko Ursulin return engine_config_sample(event->attr.config); 53b46a33e2STvrtko Ursulin } 54b46a33e2STvrtko Ursulin 55b46a33e2STvrtko Ursulin static u8 engine_event_class(struct perf_event *event) 56b46a33e2STvrtko Ursulin { 57b46a33e2STvrtko Ursulin return (event->attr.config >> I915_PMU_CLASS_SHIFT) & 0xff; 58b46a33e2STvrtko Ursulin } 59b46a33e2STvrtko Ursulin 60b46a33e2STvrtko Ursulin static u8 engine_event_instance(struct perf_event *event) 61b46a33e2STvrtko Ursulin { 62b46a33e2STvrtko Ursulin return (event->attr.config >> I915_PMU_SAMPLE_BITS) & 0xff; 63b46a33e2STvrtko Ursulin } 64b46a33e2STvrtko Ursulin 65b46a33e2STvrtko Ursulin static bool is_engine_config(u64 config) 66b46a33e2STvrtko Ursulin { 67b46a33e2STvrtko Ursulin return config < __I915_PMU_OTHER(0); 68b46a33e2STvrtko Ursulin } 69b46a33e2STvrtko Ursulin 70b46a33e2STvrtko Ursulin static unsigned int config_enabled_bit(u64 config) 71b46a33e2STvrtko Ursulin { 72b46a33e2STvrtko Ursulin if (is_engine_config(config)) 73b46a33e2STvrtko Ursulin return engine_config_sample(config); 74b46a33e2STvrtko Ursulin else 75b46a33e2STvrtko Ursulin return ENGINE_SAMPLE_BITS + (config - __I915_PMU_OTHER(0)); 76b46a33e2STvrtko Ursulin } 77b46a33e2STvrtko Ursulin 78b46a33e2STvrtko Ursulin static u64 config_enabled_mask(u64 config) 79b46a33e2STvrtko Ursulin { 80b46a33e2STvrtko Ursulin return BIT_ULL(config_enabled_bit(config)); 81b46a33e2STvrtko Ursulin } 82b46a33e2STvrtko Ursulin 83b46a33e2STvrtko Ursulin static bool is_engine_event(struct perf_event *event) 84b46a33e2STvrtko Ursulin { 85b46a33e2STvrtko Ursulin return is_engine_config(event->attr.config); 86b46a33e2STvrtko Ursulin } 87b46a33e2STvrtko Ursulin 88b46a33e2STvrtko Ursulin static unsigned int event_enabled_bit(struct perf_event *event) 89b46a33e2STvrtko Ursulin { 90b46a33e2STvrtko Ursulin return config_enabled_bit(event->attr.config); 91b46a33e2STvrtko Ursulin } 92b46a33e2STvrtko Ursulin 93feff0dc6STvrtko Ursulin static bool pmu_needs_timer(struct drm_i915_private *i915, bool gpu_active) 94feff0dc6STvrtko Ursulin { 95feff0dc6STvrtko Ursulin u64 enable; 96feff0dc6STvrtko Ursulin 97feff0dc6STvrtko Ursulin /* 98feff0dc6STvrtko Ursulin * Only some counters need the sampling timer. 99feff0dc6STvrtko Ursulin * 100feff0dc6STvrtko Ursulin * We start with a bitmask of all currently enabled events. 101feff0dc6STvrtko Ursulin */ 102feff0dc6STvrtko Ursulin enable = i915->pmu.enable; 103feff0dc6STvrtko Ursulin 104feff0dc6STvrtko Ursulin /* 105feff0dc6STvrtko Ursulin * Mask out all the ones which do not need the timer, or in 106feff0dc6STvrtko Ursulin * other words keep all the ones that could need the timer. 107feff0dc6STvrtko Ursulin */ 108feff0dc6STvrtko Ursulin enable &= config_enabled_mask(I915_PMU_ACTUAL_FREQUENCY) | 109feff0dc6STvrtko Ursulin config_enabled_mask(I915_PMU_REQUESTED_FREQUENCY) | 110feff0dc6STvrtko Ursulin ENGINE_SAMPLE_MASK; 111feff0dc6STvrtko Ursulin 112feff0dc6STvrtko Ursulin /* 113feff0dc6STvrtko Ursulin * When the GPU is idle per-engine counters do not need to be 114feff0dc6STvrtko Ursulin * running so clear those bits out. 115feff0dc6STvrtko Ursulin */ 116feff0dc6STvrtko Ursulin if (!gpu_active) 117feff0dc6STvrtko Ursulin enable &= ~ENGINE_SAMPLE_MASK; 118b3add01eSTvrtko Ursulin /* 119b3add01eSTvrtko Ursulin * Also there is software busyness tracking available we do not 120b3add01eSTvrtko Ursulin * need the timer for I915_SAMPLE_BUSY counter. 121cf669b4eSTvrtko Ursulin * 122cf669b4eSTvrtko Ursulin * Use RCS as proxy for all engines. 123b3add01eSTvrtko Ursulin */ 124cf669b4eSTvrtko Ursulin else if (intel_engine_supports_stats(i915->engine[RCS])) 125b3add01eSTvrtko Ursulin enable &= ~BIT(I915_SAMPLE_BUSY); 126feff0dc6STvrtko Ursulin 127feff0dc6STvrtko Ursulin /* 128feff0dc6STvrtko Ursulin * If some bits remain it means we need the sampling timer running. 129feff0dc6STvrtko Ursulin */ 130feff0dc6STvrtko Ursulin return enable; 131feff0dc6STvrtko Ursulin } 132feff0dc6STvrtko Ursulin 133feff0dc6STvrtko Ursulin void i915_pmu_gt_parked(struct drm_i915_private *i915) 134feff0dc6STvrtko Ursulin { 135feff0dc6STvrtko Ursulin if (!i915->pmu.base.event_init) 136feff0dc6STvrtko Ursulin return; 137feff0dc6STvrtko Ursulin 138feff0dc6STvrtko Ursulin spin_lock_irq(&i915->pmu.lock); 139feff0dc6STvrtko Ursulin /* 140feff0dc6STvrtko Ursulin * Signal sampling timer to stop if only engine events are enabled and 141feff0dc6STvrtko Ursulin * GPU went idle. 142feff0dc6STvrtko Ursulin */ 143feff0dc6STvrtko Ursulin i915->pmu.timer_enabled = pmu_needs_timer(i915, false); 144feff0dc6STvrtko Ursulin spin_unlock_irq(&i915->pmu.lock); 145feff0dc6STvrtko Ursulin } 146feff0dc6STvrtko Ursulin 147feff0dc6STvrtko Ursulin static void __i915_pmu_maybe_start_timer(struct drm_i915_private *i915) 148feff0dc6STvrtko Ursulin { 149feff0dc6STvrtko Ursulin if (!i915->pmu.timer_enabled && pmu_needs_timer(i915, true)) { 150feff0dc6STvrtko Ursulin i915->pmu.timer_enabled = true; 151feff0dc6STvrtko Ursulin hrtimer_start_range_ns(&i915->pmu.timer, 152feff0dc6STvrtko Ursulin ns_to_ktime(PERIOD), 0, 153feff0dc6STvrtko Ursulin HRTIMER_MODE_REL_PINNED); 154feff0dc6STvrtko Ursulin } 155feff0dc6STvrtko Ursulin } 156feff0dc6STvrtko Ursulin 157feff0dc6STvrtko Ursulin void i915_pmu_gt_unparked(struct drm_i915_private *i915) 158feff0dc6STvrtko Ursulin { 159feff0dc6STvrtko Ursulin if (!i915->pmu.base.event_init) 160feff0dc6STvrtko Ursulin return; 161feff0dc6STvrtko Ursulin 162feff0dc6STvrtko Ursulin spin_lock_irq(&i915->pmu.lock); 163feff0dc6STvrtko Ursulin /* 164feff0dc6STvrtko Ursulin * Re-enable sampling timer when GPU goes active. 165feff0dc6STvrtko Ursulin */ 166feff0dc6STvrtko Ursulin __i915_pmu_maybe_start_timer(i915); 167feff0dc6STvrtko Ursulin spin_unlock_irq(&i915->pmu.lock); 168feff0dc6STvrtko Ursulin } 169feff0dc6STvrtko Ursulin 170b46a33e2STvrtko Ursulin static bool grab_forcewake(struct drm_i915_private *i915, bool fw) 171b46a33e2STvrtko Ursulin { 172b46a33e2STvrtko Ursulin if (!fw) 173b46a33e2STvrtko Ursulin intel_uncore_forcewake_get(i915, FORCEWAKE_ALL); 174b46a33e2STvrtko Ursulin 175b46a33e2STvrtko Ursulin return true; 176b46a33e2STvrtko Ursulin } 177b46a33e2STvrtko Ursulin 178b46a33e2STvrtko Ursulin static void 179b46a33e2STvrtko Ursulin update_sample(struct i915_pmu_sample *sample, u32 unit, u32 val) 180b46a33e2STvrtko Ursulin { 1818ee4f19cSTvrtko Ursulin sample->cur += mul_u32_u32(val, unit); 182b46a33e2STvrtko Ursulin } 183b46a33e2STvrtko Ursulin 184b46a33e2STvrtko Ursulin static void engines_sample(struct drm_i915_private *dev_priv) 185b46a33e2STvrtko Ursulin { 186b46a33e2STvrtko Ursulin struct intel_engine_cs *engine; 187b46a33e2STvrtko Ursulin enum intel_engine_id id; 188b46a33e2STvrtko Ursulin bool fw = false; 189b46a33e2STvrtko Ursulin 190b46a33e2STvrtko Ursulin if ((dev_priv->pmu.enable & ENGINE_SAMPLE_MASK) == 0) 191b46a33e2STvrtko Ursulin return; 192b46a33e2STvrtko Ursulin 193b46a33e2STvrtko Ursulin if (!dev_priv->gt.awake) 194b46a33e2STvrtko Ursulin return; 195b46a33e2STvrtko Ursulin 196b46a33e2STvrtko Ursulin if (!intel_runtime_pm_get_if_in_use(dev_priv)) 197b46a33e2STvrtko Ursulin return; 198b46a33e2STvrtko Ursulin 199b46a33e2STvrtko Ursulin for_each_engine(engine, dev_priv, id) { 200b46a33e2STvrtko Ursulin u32 current_seqno = intel_engine_get_seqno(engine); 201b46a33e2STvrtko Ursulin u32 last_seqno = intel_engine_last_submit(engine); 202b46a33e2STvrtko Ursulin u32 val; 203b46a33e2STvrtko Ursulin 204b46a33e2STvrtko Ursulin val = !i915_seqno_passed(current_seqno, last_seqno); 205b46a33e2STvrtko Ursulin 206b46a33e2STvrtko Ursulin update_sample(&engine->pmu.sample[I915_SAMPLE_BUSY], 207b46a33e2STvrtko Ursulin PERIOD, val); 208b46a33e2STvrtko Ursulin 209b46a33e2STvrtko Ursulin if (val && (engine->pmu.enable & 210b46a33e2STvrtko Ursulin (BIT(I915_SAMPLE_WAIT) | BIT(I915_SAMPLE_SEMA)))) { 211b46a33e2STvrtko Ursulin fw = grab_forcewake(dev_priv, fw); 212b46a33e2STvrtko Ursulin 213b46a33e2STvrtko Ursulin val = I915_READ_FW(RING_CTL(engine->mmio_base)); 214b46a33e2STvrtko Ursulin } else { 215b46a33e2STvrtko Ursulin val = 0; 216b46a33e2STvrtko Ursulin } 217b46a33e2STvrtko Ursulin 218b46a33e2STvrtko Ursulin update_sample(&engine->pmu.sample[I915_SAMPLE_WAIT], 219b46a33e2STvrtko Ursulin PERIOD, !!(val & RING_WAIT)); 220b46a33e2STvrtko Ursulin 221b46a33e2STvrtko Ursulin update_sample(&engine->pmu.sample[I915_SAMPLE_SEMA], 222b46a33e2STvrtko Ursulin PERIOD, !!(val & RING_WAIT_SEMAPHORE)); 223b46a33e2STvrtko Ursulin } 224b46a33e2STvrtko Ursulin 225b46a33e2STvrtko Ursulin if (fw) 226b46a33e2STvrtko Ursulin intel_uncore_forcewake_put(dev_priv, FORCEWAKE_ALL); 227b46a33e2STvrtko Ursulin 228b46a33e2STvrtko Ursulin intel_runtime_pm_put(dev_priv); 229b46a33e2STvrtko Ursulin } 230b46a33e2STvrtko Ursulin 231b46a33e2STvrtko Ursulin static void frequency_sample(struct drm_i915_private *dev_priv) 232b46a33e2STvrtko Ursulin { 233b46a33e2STvrtko Ursulin if (dev_priv->pmu.enable & 234b46a33e2STvrtko Ursulin config_enabled_mask(I915_PMU_ACTUAL_FREQUENCY)) { 235b46a33e2STvrtko Ursulin u32 val; 236b46a33e2STvrtko Ursulin 237b46a33e2STvrtko Ursulin val = dev_priv->gt_pm.rps.cur_freq; 238b46a33e2STvrtko Ursulin if (dev_priv->gt.awake && 239b46a33e2STvrtko Ursulin intel_runtime_pm_get_if_in_use(dev_priv)) { 240b46a33e2STvrtko Ursulin val = intel_get_cagf(dev_priv, 241b46a33e2STvrtko Ursulin I915_READ_NOTRACE(GEN6_RPSTAT1)); 242b46a33e2STvrtko Ursulin intel_runtime_pm_put(dev_priv); 243b46a33e2STvrtko Ursulin } 244b46a33e2STvrtko Ursulin 245b46a33e2STvrtko Ursulin update_sample(&dev_priv->pmu.sample[__I915_SAMPLE_FREQ_ACT], 246b46a33e2STvrtko Ursulin 1, intel_gpu_freq(dev_priv, val)); 247b46a33e2STvrtko Ursulin } 248b46a33e2STvrtko Ursulin 249b46a33e2STvrtko Ursulin if (dev_priv->pmu.enable & 250b46a33e2STvrtko Ursulin config_enabled_mask(I915_PMU_REQUESTED_FREQUENCY)) { 251b46a33e2STvrtko Ursulin update_sample(&dev_priv->pmu.sample[__I915_SAMPLE_FREQ_REQ], 1, 252b46a33e2STvrtko Ursulin intel_gpu_freq(dev_priv, 253b46a33e2STvrtko Ursulin dev_priv->gt_pm.rps.cur_freq)); 254b46a33e2STvrtko Ursulin } 255b46a33e2STvrtko Ursulin } 256b46a33e2STvrtko Ursulin 257b46a33e2STvrtko Ursulin static enum hrtimer_restart i915_sample(struct hrtimer *hrtimer) 258b46a33e2STvrtko Ursulin { 259b46a33e2STvrtko Ursulin struct drm_i915_private *i915 = 260b46a33e2STvrtko Ursulin container_of(hrtimer, struct drm_i915_private, pmu.timer); 261b46a33e2STvrtko Ursulin 2628ee4f19cSTvrtko Ursulin if (!READ_ONCE(i915->pmu.timer_enabled)) 263b46a33e2STvrtko Ursulin return HRTIMER_NORESTART; 264b46a33e2STvrtko Ursulin 265b46a33e2STvrtko Ursulin engines_sample(i915); 266b46a33e2STvrtko Ursulin frequency_sample(i915); 267b46a33e2STvrtko Ursulin 268b46a33e2STvrtko Ursulin hrtimer_forward_now(hrtimer, ns_to_ktime(PERIOD)); 269b46a33e2STvrtko Ursulin return HRTIMER_RESTART; 270b46a33e2STvrtko Ursulin } 271b46a33e2STvrtko Ursulin 2720cd4684dSTvrtko Ursulin static u64 count_interrupts(struct drm_i915_private *i915) 2730cd4684dSTvrtko Ursulin { 2740cd4684dSTvrtko Ursulin /* open-coded kstat_irqs() */ 2750cd4684dSTvrtko Ursulin struct irq_desc *desc = irq_to_desc(i915->drm.pdev->irq); 2760cd4684dSTvrtko Ursulin u64 sum = 0; 2770cd4684dSTvrtko Ursulin int cpu; 2780cd4684dSTvrtko Ursulin 2790cd4684dSTvrtko Ursulin if (!desc || !desc->kstat_irqs) 2800cd4684dSTvrtko Ursulin return 0; 2810cd4684dSTvrtko Ursulin 2820cd4684dSTvrtko Ursulin for_each_possible_cpu(cpu) 2830cd4684dSTvrtko Ursulin sum += *per_cpu_ptr(desc->kstat_irqs, cpu); 2840cd4684dSTvrtko Ursulin 2850cd4684dSTvrtko Ursulin return sum; 2860cd4684dSTvrtko Ursulin } 2870cd4684dSTvrtko Ursulin 288b46a33e2STvrtko Ursulin static void i915_pmu_event_destroy(struct perf_event *event) 289b46a33e2STvrtko Ursulin { 290b46a33e2STvrtko Ursulin WARN_ON(event->parent); 291b46a33e2STvrtko Ursulin } 292b46a33e2STvrtko Ursulin 293*109ec558STvrtko Ursulin static int 294*109ec558STvrtko Ursulin engine_event_status(struct intel_engine_cs *engine, 295*109ec558STvrtko Ursulin enum drm_i915_pmu_engine_sample sample) 296b46a33e2STvrtko Ursulin { 297*109ec558STvrtko Ursulin switch (sample) { 298b46a33e2STvrtko Ursulin case I915_SAMPLE_BUSY: 299b46a33e2STvrtko Ursulin case I915_SAMPLE_WAIT: 300b46a33e2STvrtko Ursulin break; 301b46a33e2STvrtko Ursulin case I915_SAMPLE_SEMA: 302*109ec558STvrtko Ursulin if (INTEL_GEN(engine->i915) < 6) 303b46a33e2STvrtko Ursulin return -ENODEV; 304b46a33e2STvrtko Ursulin break; 305b46a33e2STvrtko Ursulin default: 306b46a33e2STvrtko Ursulin return -ENOENT; 307b46a33e2STvrtko Ursulin } 308b46a33e2STvrtko Ursulin 309b46a33e2STvrtko Ursulin return 0; 310b46a33e2STvrtko Ursulin } 311b46a33e2STvrtko Ursulin 312*109ec558STvrtko Ursulin static int 313*109ec558STvrtko Ursulin config_status(struct drm_i915_private *i915, u64 config) 314*109ec558STvrtko Ursulin { 315*109ec558STvrtko Ursulin switch (config) { 316*109ec558STvrtko Ursulin case I915_PMU_ACTUAL_FREQUENCY: 317*109ec558STvrtko Ursulin if (IS_VALLEYVIEW(i915) || IS_CHERRYVIEW(i915)) 318*109ec558STvrtko Ursulin /* Requires a mutex for sampling! */ 319*109ec558STvrtko Ursulin return -ENODEV; 320*109ec558STvrtko Ursulin /* Fall-through. */ 321*109ec558STvrtko Ursulin case I915_PMU_REQUESTED_FREQUENCY: 322*109ec558STvrtko Ursulin if (INTEL_GEN(i915) < 6) 323*109ec558STvrtko Ursulin return -ENODEV; 324*109ec558STvrtko Ursulin break; 325*109ec558STvrtko Ursulin case I915_PMU_INTERRUPTS: 326*109ec558STvrtko Ursulin break; 327*109ec558STvrtko Ursulin case I915_PMU_RC6_RESIDENCY: 328*109ec558STvrtko Ursulin if (!HAS_RC6(i915)) 329*109ec558STvrtko Ursulin return -ENODEV; 330*109ec558STvrtko Ursulin break; 331*109ec558STvrtko Ursulin default: 332*109ec558STvrtko Ursulin return -ENOENT; 333*109ec558STvrtko Ursulin } 334*109ec558STvrtko Ursulin 335*109ec558STvrtko Ursulin return 0; 336*109ec558STvrtko Ursulin } 337*109ec558STvrtko Ursulin 338*109ec558STvrtko Ursulin static int engine_event_init(struct perf_event *event) 339*109ec558STvrtko Ursulin { 340*109ec558STvrtko Ursulin struct drm_i915_private *i915 = 341*109ec558STvrtko Ursulin container_of(event->pmu, typeof(*i915), pmu.base); 342*109ec558STvrtko Ursulin struct intel_engine_cs *engine; 343*109ec558STvrtko Ursulin 344*109ec558STvrtko Ursulin engine = intel_engine_lookup_user(i915, engine_event_class(event), 345*109ec558STvrtko Ursulin engine_event_instance(event)); 346*109ec558STvrtko Ursulin if (!engine) 347*109ec558STvrtko Ursulin return -ENODEV; 348*109ec558STvrtko Ursulin 349*109ec558STvrtko Ursulin return engine_event_status(engine, engine_event_sample(event)); 350*109ec558STvrtko Ursulin } 351*109ec558STvrtko Ursulin 352b46a33e2STvrtko Ursulin static int i915_pmu_event_init(struct perf_event *event) 353b46a33e2STvrtko Ursulin { 354b46a33e2STvrtko Ursulin struct drm_i915_private *i915 = 355b46a33e2STvrtko Ursulin container_of(event->pmu, typeof(*i915), pmu.base); 3560426c046STvrtko Ursulin int ret; 357b46a33e2STvrtko Ursulin 358b46a33e2STvrtko Ursulin if (event->attr.type != event->pmu->type) 359b46a33e2STvrtko Ursulin return -ENOENT; 360b46a33e2STvrtko Ursulin 361b46a33e2STvrtko Ursulin /* unsupported modes and filters */ 362b46a33e2STvrtko Ursulin if (event->attr.sample_period) /* no sampling */ 363b46a33e2STvrtko Ursulin return -EINVAL; 364b46a33e2STvrtko Ursulin 365b46a33e2STvrtko Ursulin if (has_branch_stack(event)) 366b46a33e2STvrtko Ursulin return -EOPNOTSUPP; 367b46a33e2STvrtko Ursulin 368b46a33e2STvrtko Ursulin if (event->cpu < 0) 369b46a33e2STvrtko Ursulin return -EINVAL; 370b46a33e2STvrtko Ursulin 3710426c046STvrtko Ursulin /* only allow running on one cpu at a time */ 3720426c046STvrtko Ursulin if (!cpumask_test_cpu(event->cpu, &i915_pmu_cpumask)) 37300a79722STvrtko Ursulin return -EINVAL; 374b46a33e2STvrtko Ursulin 375*109ec558STvrtko Ursulin if (is_engine_event(event)) 376b46a33e2STvrtko Ursulin ret = engine_event_init(event); 377*109ec558STvrtko Ursulin else 378*109ec558STvrtko Ursulin ret = config_status(i915, event->attr.config); 379b46a33e2STvrtko Ursulin if (ret) 380b46a33e2STvrtko Ursulin return ret; 381b46a33e2STvrtko Ursulin 382b46a33e2STvrtko Ursulin if (!event->parent) 383b46a33e2STvrtko Ursulin event->destroy = i915_pmu_event_destroy; 384b46a33e2STvrtko Ursulin 385b46a33e2STvrtko Ursulin return 0; 386b46a33e2STvrtko Ursulin } 387b46a33e2STvrtko Ursulin 388b46a33e2STvrtko Ursulin static u64 __i915_pmu_event_read(struct perf_event *event) 389b46a33e2STvrtko Ursulin { 390b46a33e2STvrtko Ursulin struct drm_i915_private *i915 = 391b46a33e2STvrtko Ursulin container_of(event->pmu, typeof(*i915), pmu.base); 392b46a33e2STvrtko Ursulin u64 val = 0; 393b46a33e2STvrtko Ursulin 394b46a33e2STvrtko Ursulin if (is_engine_event(event)) { 395b46a33e2STvrtko Ursulin u8 sample = engine_event_sample(event); 396b46a33e2STvrtko Ursulin struct intel_engine_cs *engine; 397b46a33e2STvrtko Ursulin 398b46a33e2STvrtko Ursulin engine = intel_engine_lookup_user(i915, 399b46a33e2STvrtko Ursulin engine_event_class(event), 400b46a33e2STvrtko Ursulin engine_event_instance(event)); 401b46a33e2STvrtko Ursulin 402b46a33e2STvrtko Ursulin if (WARN_ON_ONCE(!engine)) { 403b46a33e2STvrtko Ursulin /* Do nothing */ 404b3add01eSTvrtko Ursulin } else if (sample == I915_SAMPLE_BUSY && 405b3add01eSTvrtko Ursulin engine->pmu.busy_stats) { 406b3add01eSTvrtko Ursulin val = ktime_to_ns(intel_engine_get_busy_time(engine)); 407b46a33e2STvrtko Ursulin } else { 408b46a33e2STvrtko Ursulin val = engine->pmu.sample[sample].cur; 409b46a33e2STvrtko Ursulin } 410b46a33e2STvrtko Ursulin } else { 411b46a33e2STvrtko Ursulin switch (event->attr.config) { 412b46a33e2STvrtko Ursulin case I915_PMU_ACTUAL_FREQUENCY: 413b46a33e2STvrtko Ursulin val = 414b46a33e2STvrtko Ursulin div_u64(i915->pmu.sample[__I915_SAMPLE_FREQ_ACT].cur, 415b46a33e2STvrtko Ursulin FREQUENCY); 416b46a33e2STvrtko Ursulin break; 417b46a33e2STvrtko Ursulin case I915_PMU_REQUESTED_FREQUENCY: 418b46a33e2STvrtko Ursulin val = 419b46a33e2STvrtko Ursulin div_u64(i915->pmu.sample[__I915_SAMPLE_FREQ_REQ].cur, 420b46a33e2STvrtko Ursulin FREQUENCY); 421b46a33e2STvrtko Ursulin break; 4220cd4684dSTvrtko Ursulin case I915_PMU_INTERRUPTS: 4230cd4684dSTvrtko Ursulin val = count_interrupts(i915); 4240cd4684dSTvrtko Ursulin break; 4256060b6aeSTvrtko Ursulin case I915_PMU_RC6_RESIDENCY: 4266060b6aeSTvrtko Ursulin intel_runtime_pm_get(i915); 4276060b6aeSTvrtko Ursulin val = intel_rc6_residency_ns(i915, 4286060b6aeSTvrtko Ursulin IS_VALLEYVIEW(i915) ? 4296060b6aeSTvrtko Ursulin VLV_GT_RENDER_RC6 : 4306060b6aeSTvrtko Ursulin GEN6_GT_GFX_RC6); 431fb6db0f5SChris Wilson if (HAS_RC6p(i915)) 4323452fa30STvrtko Ursulin val += intel_rc6_residency_ns(i915, 4333452fa30STvrtko Ursulin GEN6_GT_GFX_RC6p); 434fb6db0f5SChris Wilson if (HAS_RC6pp(i915)) 4353452fa30STvrtko Ursulin val += intel_rc6_residency_ns(i915, 4363452fa30STvrtko Ursulin GEN6_GT_GFX_RC6pp); 4376060b6aeSTvrtko Ursulin intel_runtime_pm_put(i915); 4386060b6aeSTvrtko Ursulin break; 439b46a33e2STvrtko Ursulin } 440b46a33e2STvrtko Ursulin } 441b46a33e2STvrtko Ursulin 442b46a33e2STvrtko Ursulin return val; 443b46a33e2STvrtko Ursulin } 444b46a33e2STvrtko Ursulin 445b46a33e2STvrtko Ursulin static void i915_pmu_event_read(struct perf_event *event) 446b46a33e2STvrtko Ursulin { 447b46a33e2STvrtko Ursulin struct hw_perf_event *hwc = &event->hw; 448b46a33e2STvrtko Ursulin u64 prev, new; 449b46a33e2STvrtko Ursulin 450b46a33e2STvrtko Ursulin again: 451b46a33e2STvrtko Ursulin prev = local64_read(&hwc->prev_count); 452b46a33e2STvrtko Ursulin new = __i915_pmu_event_read(event); 453b46a33e2STvrtko Ursulin 454b46a33e2STvrtko Ursulin if (local64_cmpxchg(&hwc->prev_count, prev, new) != prev) 455b46a33e2STvrtko Ursulin goto again; 456b46a33e2STvrtko Ursulin 457b46a33e2STvrtko Ursulin local64_add(new - prev, &event->count); 458b46a33e2STvrtko Ursulin } 459b46a33e2STvrtko Ursulin 460b3add01eSTvrtko Ursulin static bool engine_needs_busy_stats(struct intel_engine_cs *engine) 461b3add01eSTvrtko Ursulin { 462cf669b4eSTvrtko Ursulin return intel_engine_supports_stats(engine) && 463b3add01eSTvrtko Ursulin (engine->pmu.enable & BIT(I915_SAMPLE_BUSY)); 464b3add01eSTvrtko Ursulin } 465b3add01eSTvrtko Ursulin 466b46a33e2STvrtko Ursulin static void i915_pmu_enable(struct perf_event *event) 467b46a33e2STvrtko Ursulin { 468b46a33e2STvrtko Ursulin struct drm_i915_private *i915 = 469b46a33e2STvrtko Ursulin container_of(event->pmu, typeof(*i915), pmu.base); 470b46a33e2STvrtko Ursulin unsigned int bit = event_enabled_bit(event); 471b46a33e2STvrtko Ursulin unsigned long flags; 472b46a33e2STvrtko Ursulin 473b46a33e2STvrtko Ursulin spin_lock_irqsave(&i915->pmu.lock, flags); 474b46a33e2STvrtko Ursulin 475b46a33e2STvrtko Ursulin /* 476b46a33e2STvrtko Ursulin * Update the bitmask of enabled events and increment 477b46a33e2STvrtko Ursulin * the event reference counter. 478b46a33e2STvrtko Ursulin */ 479b46a33e2STvrtko Ursulin GEM_BUG_ON(bit >= I915_PMU_MASK_BITS); 480b46a33e2STvrtko Ursulin GEM_BUG_ON(i915->pmu.enable_count[bit] == ~0); 481b46a33e2STvrtko Ursulin i915->pmu.enable |= BIT_ULL(bit); 482b46a33e2STvrtko Ursulin i915->pmu.enable_count[bit]++; 483b46a33e2STvrtko Ursulin 484b46a33e2STvrtko Ursulin /* 485feff0dc6STvrtko Ursulin * Start the sampling timer if needed and not already enabled. 486feff0dc6STvrtko Ursulin */ 487feff0dc6STvrtko Ursulin __i915_pmu_maybe_start_timer(i915); 488feff0dc6STvrtko Ursulin 489feff0dc6STvrtko Ursulin /* 490b46a33e2STvrtko Ursulin * For per-engine events the bitmask and reference counting 491b46a33e2STvrtko Ursulin * is stored per engine. 492b46a33e2STvrtko Ursulin */ 493b46a33e2STvrtko Ursulin if (is_engine_event(event)) { 494b46a33e2STvrtko Ursulin u8 sample = engine_event_sample(event); 495b46a33e2STvrtko Ursulin struct intel_engine_cs *engine; 496b46a33e2STvrtko Ursulin 497b46a33e2STvrtko Ursulin engine = intel_engine_lookup_user(i915, 498b46a33e2STvrtko Ursulin engine_event_class(event), 499b46a33e2STvrtko Ursulin engine_event_instance(event)); 500b46a33e2STvrtko Ursulin GEM_BUG_ON(!engine); 501b46a33e2STvrtko Ursulin engine->pmu.enable |= BIT(sample); 502b46a33e2STvrtko Ursulin 503b46a33e2STvrtko Ursulin GEM_BUG_ON(sample >= I915_PMU_SAMPLE_BITS); 504b46a33e2STvrtko Ursulin GEM_BUG_ON(engine->pmu.enable_count[sample] == ~0); 505b3add01eSTvrtko Ursulin if (engine->pmu.enable_count[sample]++ == 0) { 506b3add01eSTvrtko Ursulin /* 507b3add01eSTvrtko Ursulin * Enable engine busy stats tracking if needed or 508b3add01eSTvrtko Ursulin * alternatively cancel the scheduled disable. 509b3add01eSTvrtko Ursulin * 510b3add01eSTvrtko Ursulin * If the delayed disable was pending, cancel it and 511b3add01eSTvrtko Ursulin * in this case do not enable since it already is. 512b3add01eSTvrtko Ursulin */ 513b3add01eSTvrtko Ursulin if (engine_needs_busy_stats(engine) && 514b3add01eSTvrtko Ursulin !engine->pmu.busy_stats) { 515b3add01eSTvrtko Ursulin engine->pmu.busy_stats = true; 516b3add01eSTvrtko Ursulin if (!cancel_delayed_work(&engine->pmu.disable_busy_stats)) 517b3add01eSTvrtko Ursulin intel_enable_engine_stats(engine); 518b3add01eSTvrtko Ursulin } 519b3add01eSTvrtko Ursulin } 520b46a33e2STvrtko Ursulin } 521b46a33e2STvrtko Ursulin 522b46a33e2STvrtko Ursulin /* 523b46a33e2STvrtko Ursulin * Store the current counter value so we can report the correct delta 524b46a33e2STvrtko Ursulin * for all listeners. Even when the event was already enabled and has 525b46a33e2STvrtko Ursulin * an existing non-zero value. 526b46a33e2STvrtko Ursulin */ 527b46a33e2STvrtko Ursulin local64_set(&event->hw.prev_count, __i915_pmu_event_read(event)); 528b46a33e2STvrtko Ursulin 529b46a33e2STvrtko Ursulin spin_unlock_irqrestore(&i915->pmu.lock, flags); 530b46a33e2STvrtko Ursulin } 531b46a33e2STvrtko Ursulin 532b3add01eSTvrtko Ursulin static void __disable_busy_stats(struct work_struct *work) 533b3add01eSTvrtko Ursulin { 534b3add01eSTvrtko Ursulin struct intel_engine_cs *engine = 535b3add01eSTvrtko Ursulin container_of(work, typeof(*engine), pmu.disable_busy_stats.work); 536b3add01eSTvrtko Ursulin 537b3add01eSTvrtko Ursulin intel_disable_engine_stats(engine); 538b3add01eSTvrtko Ursulin } 539b3add01eSTvrtko Ursulin 540b46a33e2STvrtko Ursulin static void i915_pmu_disable(struct perf_event *event) 541b46a33e2STvrtko Ursulin { 542b46a33e2STvrtko Ursulin struct drm_i915_private *i915 = 543b46a33e2STvrtko Ursulin container_of(event->pmu, typeof(*i915), pmu.base); 544b46a33e2STvrtko Ursulin unsigned int bit = event_enabled_bit(event); 545b46a33e2STvrtko Ursulin unsigned long flags; 546b46a33e2STvrtko Ursulin 547b46a33e2STvrtko Ursulin spin_lock_irqsave(&i915->pmu.lock, flags); 548b46a33e2STvrtko Ursulin 549b46a33e2STvrtko Ursulin if (is_engine_event(event)) { 550b46a33e2STvrtko Ursulin u8 sample = engine_event_sample(event); 551b46a33e2STvrtko Ursulin struct intel_engine_cs *engine; 552b46a33e2STvrtko Ursulin 553b46a33e2STvrtko Ursulin engine = intel_engine_lookup_user(i915, 554b46a33e2STvrtko Ursulin engine_event_class(event), 555b46a33e2STvrtko Ursulin engine_event_instance(event)); 556b46a33e2STvrtko Ursulin GEM_BUG_ON(!engine); 557b46a33e2STvrtko Ursulin GEM_BUG_ON(sample >= I915_PMU_SAMPLE_BITS); 558b46a33e2STvrtko Ursulin GEM_BUG_ON(engine->pmu.enable_count[sample] == 0); 559b46a33e2STvrtko Ursulin /* 560b46a33e2STvrtko Ursulin * Decrement the reference count and clear the enabled 561b46a33e2STvrtko Ursulin * bitmask when the last listener on an event goes away. 562b46a33e2STvrtko Ursulin */ 563b3add01eSTvrtko Ursulin if (--engine->pmu.enable_count[sample] == 0) { 564b46a33e2STvrtko Ursulin engine->pmu.enable &= ~BIT(sample); 565b3add01eSTvrtko Ursulin if (!engine_needs_busy_stats(engine) && 566b3add01eSTvrtko Ursulin engine->pmu.busy_stats) { 567b3add01eSTvrtko Ursulin engine->pmu.busy_stats = false; 568b3add01eSTvrtko Ursulin /* 569b3add01eSTvrtko Ursulin * We request a delayed disable to handle the 570b3add01eSTvrtko Ursulin * rapid on/off cycles on events, which can 571b3add01eSTvrtko Ursulin * happen when tools like perf stat start, in a 572b3add01eSTvrtko Ursulin * nicer way. 573b3add01eSTvrtko Ursulin * 574b3add01eSTvrtko Ursulin * In addition, this also helps with busy stats 575b3add01eSTvrtko Ursulin * accuracy with background CPU offline/online 576b3add01eSTvrtko Ursulin * migration events. 577b3add01eSTvrtko Ursulin */ 578b3add01eSTvrtko Ursulin queue_delayed_work(system_wq, 579b3add01eSTvrtko Ursulin &engine->pmu.disable_busy_stats, 580b3add01eSTvrtko Ursulin round_jiffies_up_relative(HZ)); 581b3add01eSTvrtko Ursulin } 582b3add01eSTvrtko Ursulin } 583b46a33e2STvrtko Ursulin } 584b46a33e2STvrtko Ursulin 585b46a33e2STvrtko Ursulin GEM_BUG_ON(bit >= I915_PMU_MASK_BITS); 586b46a33e2STvrtko Ursulin GEM_BUG_ON(i915->pmu.enable_count[bit] == 0); 587b46a33e2STvrtko Ursulin /* 588b46a33e2STvrtko Ursulin * Decrement the reference count and clear the enabled 589b46a33e2STvrtko Ursulin * bitmask when the last listener on an event goes away. 590b46a33e2STvrtko Ursulin */ 591feff0dc6STvrtko Ursulin if (--i915->pmu.enable_count[bit] == 0) { 592b46a33e2STvrtko Ursulin i915->pmu.enable &= ~BIT_ULL(bit); 593feff0dc6STvrtko Ursulin i915->pmu.timer_enabled &= pmu_needs_timer(i915, true); 594feff0dc6STvrtko Ursulin } 595b46a33e2STvrtko Ursulin 596b46a33e2STvrtko Ursulin spin_unlock_irqrestore(&i915->pmu.lock, flags); 597b46a33e2STvrtko Ursulin } 598b46a33e2STvrtko Ursulin 599b46a33e2STvrtko Ursulin static void i915_pmu_event_start(struct perf_event *event, int flags) 600b46a33e2STvrtko Ursulin { 601b46a33e2STvrtko Ursulin i915_pmu_enable(event); 602b46a33e2STvrtko Ursulin event->hw.state = 0; 603b46a33e2STvrtko Ursulin } 604b46a33e2STvrtko Ursulin 605b46a33e2STvrtko Ursulin static void i915_pmu_event_stop(struct perf_event *event, int flags) 606b46a33e2STvrtko Ursulin { 607b46a33e2STvrtko Ursulin if (flags & PERF_EF_UPDATE) 608b46a33e2STvrtko Ursulin i915_pmu_event_read(event); 609b46a33e2STvrtko Ursulin i915_pmu_disable(event); 610b46a33e2STvrtko Ursulin event->hw.state = PERF_HES_STOPPED; 611b46a33e2STvrtko Ursulin } 612b46a33e2STvrtko Ursulin 613b46a33e2STvrtko Ursulin static int i915_pmu_event_add(struct perf_event *event, int flags) 614b46a33e2STvrtko Ursulin { 615b46a33e2STvrtko Ursulin if (flags & PERF_EF_START) 616b46a33e2STvrtko Ursulin i915_pmu_event_start(event, flags); 617b46a33e2STvrtko Ursulin 618b46a33e2STvrtko Ursulin return 0; 619b46a33e2STvrtko Ursulin } 620b46a33e2STvrtko Ursulin 621b46a33e2STvrtko Ursulin static void i915_pmu_event_del(struct perf_event *event, int flags) 622b46a33e2STvrtko Ursulin { 623b46a33e2STvrtko Ursulin i915_pmu_event_stop(event, PERF_EF_UPDATE); 624b46a33e2STvrtko Ursulin } 625b46a33e2STvrtko Ursulin 626b46a33e2STvrtko Ursulin static int i915_pmu_event_event_idx(struct perf_event *event) 627b46a33e2STvrtko Ursulin { 628b46a33e2STvrtko Ursulin return 0; 629b46a33e2STvrtko Ursulin } 630b46a33e2STvrtko Ursulin 631b7d3aabfSChris Wilson struct i915_str_attribute { 632b7d3aabfSChris Wilson struct device_attribute attr; 633b7d3aabfSChris Wilson const char *str; 634b7d3aabfSChris Wilson }; 635b7d3aabfSChris Wilson 636b46a33e2STvrtko Ursulin static ssize_t i915_pmu_format_show(struct device *dev, 637b46a33e2STvrtko Ursulin struct device_attribute *attr, char *buf) 638b46a33e2STvrtko Ursulin { 639b7d3aabfSChris Wilson struct i915_str_attribute *eattr; 640b46a33e2STvrtko Ursulin 641b7d3aabfSChris Wilson eattr = container_of(attr, struct i915_str_attribute, attr); 642b7d3aabfSChris Wilson return sprintf(buf, "%s\n", eattr->str); 643b46a33e2STvrtko Ursulin } 644b46a33e2STvrtko Ursulin 645b46a33e2STvrtko Ursulin #define I915_PMU_FORMAT_ATTR(_name, _config) \ 646b7d3aabfSChris Wilson (&((struct i915_str_attribute[]) { \ 647b46a33e2STvrtko Ursulin { .attr = __ATTR(_name, 0444, i915_pmu_format_show, NULL), \ 648b7d3aabfSChris Wilson .str = _config, } \ 649b46a33e2STvrtko Ursulin })[0].attr.attr) 650b46a33e2STvrtko Ursulin 651b46a33e2STvrtko Ursulin static struct attribute *i915_pmu_format_attrs[] = { 652b46a33e2STvrtko Ursulin I915_PMU_FORMAT_ATTR(i915_eventid, "config:0-20"), 653b46a33e2STvrtko Ursulin NULL, 654b46a33e2STvrtko Ursulin }; 655b46a33e2STvrtko Ursulin 656b46a33e2STvrtko Ursulin static const struct attribute_group i915_pmu_format_attr_group = { 657b46a33e2STvrtko Ursulin .name = "format", 658b46a33e2STvrtko Ursulin .attrs = i915_pmu_format_attrs, 659b46a33e2STvrtko Ursulin }; 660b46a33e2STvrtko Ursulin 661b7d3aabfSChris Wilson struct i915_ext_attribute { 662b7d3aabfSChris Wilson struct device_attribute attr; 663b7d3aabfSChris Wilson unsigned long val; 664b7d3aabfSChris Wilson }; 665b7d3aabfSChris Wilson 666b46a33e2STvrtko Ursulin static ssize_t i915_pmu_event_show(struct device *dev, 667b46a33e2STvrtko Ursulin struct device_attribute *attr, char *buf) 668b46a33e2STvrtko Ursulin { 669b7d3aabfSChris Wilson struct i915_ext_attribute *eattr; 670b46a33e2STvrtko Ursulin 671b7d3aabfSChris Wilson eattr = container_of(attr, struct i915_ext_attribute, attr); 672b7d3aabfSChris Wilson return sprintf(buf, "config=0x%lx\n", eattr->val); 673b46a33e2STvrtko Ursulin } 674b46a33e2STvrtko Ursulin 675*109ec558STvrtko Ursulin static struct attribute_group i915_pmu_events_attr_group = { 676b46a33e2STvrtko Ursulin .name = "events", 677*109ec558STvrtko Ursulin /* Patch in attrs at runtime. */ 678b46a33e2STvrtko Ursulin }; 679b46a33e2STvrtko Ursulin 680b46a33e2STvrtko Ursulin static ssize_t 681b46a33e2STvrtko Ursulin i915_pmu_get_attr_cpumask(struct device *dev, 682b46a33e2STvrtko Ursulin struct device_attribute *attr, 683b46a33e2STvrtko Ursulin char *buf) 684b46a33e2STvrtko Ursulin { 685b46a33e2STvrtko Ursulin return cpumap_print_to_pagebuf(true, buf, &i915_pmu_cpumask); 686b46a33e2STvrtko Ursulin } 687b46a33e2STvrtko Ursulin 688b46a33e2STvrtko Ursulin static DEVICE_ATTR(cpumask, 0444, i915_pmu_get_attr_cpumask, NULL); 689b46a33e2STvrtko Ursulin 690b46a33e2STvrtko Ursulin static struct attribute *i915_cpumask_attrs[] = { 691b46a33e2STvrtko Ursulin &dev_attr_cpumask.attr, 692b46a33e2STvrtko Ursulin NULL, 693b46a33e2STvrtko Ursulin }; 694b46a33e2STvrtko Ursulin 695*109ec558STvrtko Ursulin static const struct attribute_group i915_pmu_cpumask_attr_group = { 696b46a33e2STvrtko Ursulin .attrs = i915_cpumask_attrs, 697b46a33e2STvrtko Ursulin }; 698b46a33e2STvrtko Ursulin 699b46a33e2STvrtko Ursulin static const struct attribute_group *i915_pmu_attr_groups[] = { 700b46a33e2STvrtko Ursulin &i915_pmu_format_attr_group, 701b46a33e2STvrtko Ursulin &i915_pmu_events_attr_group, 702b46a33e2STvrtko Ursulin &i915_pmu_cpumask_attr_group, 703b46a33e2STvrtko Ursulin NULL 704b46a33e2STvrtko Ursulin }; 705b46a33e2STvrtko Ursulin 706*109ec558STvrtko Ursulin #define __event(__config, __name, __unit) \ 707*109ec558STvrtko Ursulin { \ 708*109ec558STvrtko Ursulin .config = (__config), \ 709*109ec558STvrtko Ursulin .name = (__name), \ 710*109ec558STvrtko Ursulin .unit = (__unit), \ 711*109ec558STvrtko Ursulin } 712*109ec558STvrtko Ursulin 713*109ec558STvrtko Ursulin #define __engine_event(__sample, __name) \ 714*109ec558STvrtko Ursulin { \ 715*109ec558STvrtko Ursulin .sample = (__sample), \ 716*109ec558STvrtko Ursulin .name = (__name), \ 717*109ec558STvrtko Ursulin } 718*109ec558STvrtko Ursulin 719*109ec558STvrtko Ursulin static struct i915_ext_attribute * 720*109ec558STvrtko Ursulin add_i915_attr(struct i915_ext_attribute *attr, const char *name, u64 config) 721*109ec558STvrtko Ursulin { 722*109ec558STvrtko Ursulin attr->attr.attr.name = name; 723*109ec558STvrtko Ursulin attr->attr.attr.mode = 0444; 724*109ec558STvrtko Ursulin attr->attr.show = i915_pmu_event_show; 725*109ec558STvrtko Ursulin attr->val = config; 726*109ec558STvrtko Ursulin 727*109ec558STvrtko Ursulin return ++attr; 728*109ec558STvrtko Ursulin } 729*109ec558STvrtko Ursulin 730*109ec558STvrtko Ursulin static struct perf_pmu_events_attr * 731*109ec558STvrtko Ursulin add_pmu_attr(struct perf_pmu_events_attr *attr, const char *name, 732*109ec558STvrtko Ursulin const char *str) 733*109ec558STvrtko Ursulin { 734*109ec558STvrtko Ursulin attr->attr.attr.name = name; 735*109ec558STvrtko Ursulin attr->attr.attr.mode = 0444; 736*109ec558STvrtko Ursulin attr->attr.show = perf_event_sysfs_show; 737*109ec558STvrtko Ursulin attr->event_str = str; 738*109ec558STvrtko Ursulin 739*109ec558STvrtko Ursulin return ++attr; 740*109ec558STvrtko Ursulin } 741*109ec558STvrtko Ursulin 742*109ec558STvrtko Ursulin static struct attribute ** 743*109ec558STvrtko Ursulin create_event_attributes(struct drm_i915_private *i915) 744*109ec558STvrtko Ursulin { 745*109ec558STvrtko Ursulin static const struct { 746*109ec558STvrtko Ursulin u64 config; 747*109ec558STvrtko Ursulin const char *name; 748*109ec558STvrtko Ursulin const char *unit; 749*109ec558STvrtko Ursulin } events[] = { 750*109ec558STvrtko Ursulin __event(I915_PMU_ACTUAL_FREQUENCY, "actual-frequency", "MHz"), 751*109ec558STvrtko Ursulin __event(I915_PMU_REQUESTED_FREQUENCY, "requested-frequency", "MHz"), 752*109ec558STvrtko Ursulin __event(I915_PMU_INTERRUPTS, "interrupts", NULL), 753*109ec558STvrtko Ursulin __event(I915_PMU_RC6_RESIDENCY, "rc6-residency", "ns"), 754*109ec558STvrtko Ursulin }; 755*109ec558STvrtko Ursulin static const struct { 756*109ec558STvrtko Ursulin enum drm_i915_pmu_engine_sample sample; 757*109ec558STvrtko Ursulin char *name; 758*109ec558STvrtko Ursulin } engine_events[] = { 759*109ec558STvrtko Ursulin __engine_event(I915_SAMPLE_BUSY, "busy"), 760*109ec558STvrtko Ursulin __engine_event(I915_SAMPLE_SEMA, "sema"), 761*109ec558STvrtko Ursulin __engine_event(I915_SAMPLE_WAIT, "wait"), 762*109ec558STvrtko Ursulin }; 763*109ec558STvrtko Ursulin unsigned int count = 0; 764*109ec558STvrtko Ursulin struct perf_pmu_events_attr *pmu_attr = NULL, *pmu_iter; 765*109ec558STvrtko Ursulin struct i915_ext_attribute *i915_attr = NULL, *i915_iter; 766*109ec558STvrtko Ursulin struct attribute **attr = NULL, **attr_iter; 767*109ec558STvrtko Ursulin struct intel_engine_cs *engine; 768*109ec558STvrtko Ursulin enum intel_engine_id id; 769*109ec558STvrtko Ursulin unsigned int i; 770*109ec558STvrtko Ursulin 771*109ec558STvrtko Ursulin /* Count how many counters we will be exposing. */ 772*109ec558STvrtko Ursulin for (i = 0; i < ARRAY_SIZE(events); i++) { 773*109ec558STvrtko Ursulin if (!config_status(i915, events[i].config)) 774*109ec558STvrtko Ursulin count++; 775*109ec558STvrtko Ursulin } 776*109ec558STvrtko Ursulin 777*109ec558STvrtko Ursulin for_each_engine(engine, i915, id) { 778*109ec558STvrtko Ursulin for (i = 0; i < ARRAY_SIZE(engine_events); i++) { 779*109ec558STvrtko Ursulin if (!engine_event_status(engine, 780*109ec558STvrtko Ursulin engine_events[i].sample)) 781*109ec558STvrtko Ursulin count++; 782*109ec558STvrtko Ursulin } 783*109ec558STvrtko Ursulin } 784*109ec558STvrtko Ursulin 785*109ec558STvrtko Ursulin /* Allocate attribute objects and table. */ 786*109ec558STvrtko Ursulin i915_attr = kzalloc(count * sizeof(*i915_attr), GFP_KERNEL); 787*109ec558STvrtko Ursulin if (!i915_attr) 788*109ec558STvrtko Ursulin goto err_alloc; 789*109ec558STvrtko Ursulin 790*109ec558STvrtko Ursulin pmu_attr = kzalloc(count * sizeof(*pmu_attr), GFP_KERNEL); 791*109ec558STvrtko Ursulin if (!pmu_attr) 792*109ec558STvrtko Ursulin goto err_alloc; 793*109ec558STvrtko Ursulin 794*109ec558STvrtko Ursulin /* Max one pointer of each attribute type plus a termination entry. */ 795*109ec558STvrtko Ursulin attr = kzalloc((count * 2 + 1) * sizeof(attr), GFP_KERNEL); 796*109ec558STvrtko Ursulin if (!attr) 797*109ec558STvrtko Ursulin goto err_alloc; 798*109ec558STvrtko Ursulin 799*109ec558STvrtko Ursulin i915_iter = i915_attr; 800*109ec558STvrtko Ursulin pmu_iter = pmu_attr; 801*109ec558STvrtko Ursulin attr_iter = attr; 802*109ec558STvrtko Ursulin 803*109ec558STvrtko Ursulin /* Initialize supported non-engine counters. */ 804*109ec558STvrtko Ursulin for (i = 0; i < ARRAY_SIZE(events); i++) { 805*109ec558STvrtko Ursulin char *str; 806*109ec558STvrtko Ursulin 807*109ec558STvrtko Ursulin if (config_status(i915, events[i].config)) 808*109ec558STvrtko Ursulin continue; 809*109ec558STvrtko Ursulin 810*109ec558STvrtko Ursulin str = kstrdup(events[i].name, GFP_KERNEL); 811*109ec558STvrtko Ursulin if (!str) 812*109ec558STvrtko Ursulin goto err; 813*109ec558STvrtko Ursulin 814*109ec558STvrtko Ursulin *attr_iter++ = &i915_iter->attr.attr; 815*109ec558STvrtko Ursulin i915_iter = add_i915_attr(i915_iter, str, events[i].config); 816*109ec558STvrtko Ursulin 817*109ec558STvrtko Ursulin if (events[i].unit) { 818*109ec558STvrtko Ursulin str = kasprintf(GFP_KERNEL, "%s.unit", events[i].name); 819*109ec558STvrtko Ursulin if (!str) 820*109ec558STvrtko Ursulin goto err; 821*109ec558STvrtko Ursulin 822*109ec558STvrtko Ursulin *attr_iter++ = &pmu_iter->attr.attr; 823*109ec558STvrtko Ursulin pmu_iter = add_pmu_attr(pmu_iter, str, events[i].unit); 824*109ec558STvrtko Ursulin } 825*109ec558STvrtko Ursulin } 826*109ec558STvrtko Ursulin 827*109ec558STvrtko Ursulin /* Initialize supported engine counters. */ 828*109ec558STvrtko Ursulin for_each_engine(engine, i915, id) { 829*109ec558STvrtko Ursulin for (i = 0; i < ARRAY_SIZE(engine_events); i++) { 830*109ec558STvrtko Ursulin char *str; 831*109ec558STvrtko Ursulin 832*109ec558STvrtko Ursulin if (engine_event_status(engine, 833*109ec558STvrtko Ursulin engine_events[i].sample)) 834*109ec558STvrtko Ursulin continue; 835*109ec558STvrtko Ursulin 836*109ec558STvrtko Ursulin str = kasprintf(GFP_KERNEL, "%s-%s", 837*109ec558STvrtko Ursulin engine->name, engine_events[i].name); 838*109ec558STvrtko Ursulin if (!str) 839*109ec558STvrtko Ursulin goto err; 840*109ec558STvrtko Ursulin 841*109ec558STvrtko Ursulin *attr_iter++ = &i915_iter->attr.attr; 842*109ec558STvrtko Ursulin i915_iter = 843*109ec558STvrtko Ursulin add_i915_attr(i915_iter, str, 844*109ec558STvrtko Ursulin __I915_PMU_ENGINE(engine->class, 845*109ec558STvrtko Ursulin engine->instance, 846*109ec558STvrtko Ursulin engine_events[i].sample)); 847*109ec558STvrtko Ursulin 848*109ec558STvrtko Ursulin str = kasprintf(GFP_KERNEL, "%s-%s.unit", 849*109ec558STvrtko Ursulin engine->name, engine_events[i].name); 850*109ec558STvrtko Ursulin if (!str) 851*109ec558STvrtko Ursulin goto err; 852*109ec558STvrtko Ursulin 853*109ec558STvrtko Ursulin *attr_iter++ = &pmu_iter->attr.attr; 854*109ec558STvrtko Ursulin pmu_iter = add_pmu_attr(pmu_iter, str, "ns"); 855*109ec558STvrtko Ursulin } 856*109ec558STvrtko Ursulin } 857*109ec558STvrtko Ursulin 858*109ec558STvrtko Ursulin i915->pmu.i915_attr = i915_attr; 859*109ec558STvrtko Ursulin i915->pmu.pmu_attr = pmu_attr; 860*109ec558STvrtko Ursulin 861*109ec558STvrtko Ursulin return attr; 862*109ec558STvrtko Ursulin 863*109ec558STvrtko Ursulin err:; 864*109ec558STvrtko Ursulin for (attr_iter = attr; *attr_iter; attr_iter++) 865*109ec558STvrtko Ursulin kfree((*attr_iter)->name); 866*109ec558STvrtko Ursulin 867*109ec558STvrtko Ursulin err_alloc: 868*109ec558STvrtko Ursulin kfree(attr); 869*109ec558STvrtko Ursulin kfree(i915_attr); 870*109ec558STvrtko Ursulin kfree(pmu_attr); 871*109ec558STvrtko Ursulin 872*109ec558STvrtko Ursulin return NULL; 873*109ec558STvrtko Ursulin } 874*109ec558STvrtko Ursulin 875*109ec558STvrtko Ursulin static void free_event_attributes(struct drm_i915_private *i915) 876*109ec558STvrtko Ursulin { 877*109ec558STvrtko Ursulin struct attribute **attr_iter = i915_pmu_events_attr_group.attrs; 878*109ec558STvrtko Ursulin 879*109ec558STvrtko Ursulin for (; *attr_iter; attr_iter++) 880*109ec558STvrtko Ursulin kfree((*attr_iter)->name); 881*109ec558STvrtko Ursulin 882*109ec558STvrtko Ursulin kfree(i915_pmu_events_attr_group.attrs); 883*109ec558STvrtko Ursulin kfree(i915->pmu.i915_attr); 884*109ec558STvrtko Ursulin kfree(i915->pmu.pmu_attr); 885*109ec558STvrtko Ursulin 886*109ec558STvrtko Ursulin i915_pmu_events_attr_group.attrs = NULL; 887*109ec558STvrtko Ursulin i915->pmu.i915_attr = NULL; 888*109ec558STvrtko Ursulin i915->pmu.pmu_attr = NULL; 889*109ec558STvrtko Ursulin } 890*109ec558STvrtko Ursulin 891b46a33e2STvrtko Ursulin static int i915_pmu_cpu_online(unsigned int cpu, struct hlist_node *node) 892b46a33e2STvrtko Ursulin { 893b46a33e2STvrtko Ursulin struct i915_pmu *pmu = hlist_entry_safe(node, typeof(*pmu), node); 894b46a33e2STvrtko Ursulin 895b46a33e2STvrtko Ursulin GEM_BUG_ON(!pmu->base.event_init); 896b46a33e2STvrtko Ursulin 897b46a33e2STvrtko Ursulin /* Select the first online CPU as a designated reader. */ 8980426c046STvrtko Ursulin if (!cpumask_weight(&i915_pmu_cpumask)) 899b46a33e2STvrtko Ursulin cpumask_set_cpu(cpu, &i915_pmu_cpumask); 900b46a33e2STvrtko Ursulin 901b46a33e2STvrtko Ursulin return 0; 902b46a33e2STvrtko Ursulin } 903b46a33e2STvrtko Ursulin 904b46a33e2STvrtko Ursulin static int i915_pmu_cpu_offline(unsigned int cpu, struct hlist_node *node) 905b46a33e2STvrtko Ursulin { 906b46a33e2STvrtko Ursulin struct i915_pmu *pmu = hlist_entry_safe(node, typeof(*pmu), node); 907b46a33e2STvrtko Ursulin unsigned int target; 908b46a33e2STvrtko Ursulin 909b46a33e2STvrtko Ursulin GEM_BUG_ON(!pmu->base.event_init); 910b46a33e2STvrtko Ursulin 911b46a33e2STvrtko Ursulin if (cpumask_test_and_clear_cpu(cpu, &i915_pmu_cpumask)) { 912b46a33e2STvrtko Ursulin target = cpumask_any_but(topology_sibling_cpumask(cpu), cpu); 913b46a33e2STvrtko Ursulin /* Migrate events if there is a valid target */ 914b46a33e2STvrtko Ursulin if (target < nr_cpu_ids) { 915b46a33e2STvrtko Ursulin cpumask_set_cpu(target, &i915_pmu_cpumask); 916b46a33e2STvrtko Ursulin perf_pmu_migrate_context(&pmu->base, cpu, target); 917b46a33e2STvrtko Ursulin } 918b46a33e2STvrtko Ursulin } 919b46a33e2STvrtko Ursulin 920b46a33e2STvrtko Ursulin return 0; 921b46a33e2STvrtko Ursulin } 922b46a33e2STvrtko Ursulin 923b46a33e2STvrtko Ursulin static enum cpuhp_state cpuhp_slot = CPUHP_INVALID; 924b46a33e2STvrtko Ursulin 925b46a33e2STvrtko Ursulin static int i915_pmu_register_cpuhp_state(struct drm_i915_private *i915) 926b46a33e2STvrtko Ursulin { 927b46a33e2STvrtko Ursulin enum cpuhp_state slot; 928b46a33e2STvrtko Ursulin int ret; 929b46a33e2STvrtko Ursulin 930b46a33e2STvrtko Ursulin ret = cpuhp_setup_state_multi(CPUHP_AP_ONLINE_DYN, 931b46a33e2STvrtko Ursulin "perf/x86/intel/i915:online", 932b46a33e2STvrtko Ursulin i915_pmu_cpu_online, 933b46a33e2STvrtko Ursulin i915_pmu_cpu_offline); 934b46a33e2STvrtko Ursulin if (ret < 0) 935b46a33e2STvrtko Ursulin return ret; 936b46a33e2STvrtko Ursulin 937b46a33e2STvrtko Ursulin slot = ret; 938b46a33e2STvrtko Ursulin ret = cpuhp_state_add_instance(slot, &i915->pmu.node); 939b46a33e2STvrtko Ursulin if (ret) { 940b46a33e2STvrtko Ursulin cpuhp_remove_multi_state(slot); 941b46a33e2STvrtko Ursulin return ret; 942b46a33e2STvrtko Ursulin } 943b46a33e2STvrtko Ursulin 944b46a33e2STvrtko Ursulin cpuhp_slot = slot; 945b46a33e2STvrtko Ursulin return 0; 946b46a33e2STvrtko Ursulin } 947b46a33e2STvrtko Ursulin 948b46a33e2STvrtko Ursulin static void i915_pmu_unregister_cpuhp_state(struct drm_i915_private *i915) 949b46a33e2STvrtko Ursulin { 950b46a33e2STvrtko Ursulin WARN_ON(cpuhp_slot == CPUHP_INVALID); 951b46a33e2STvrtko Ursulin WARN_ON(cpuhp_state_remove_instance(cpuhp_slot, &i915->pmu.node)); 952b46a33e2STvrtko Ursulin cpuhp_remove_multi_state(cpuhp_slot); 953b46a33e2STvrtko Ursulin } 954b46a33e2STvrtko Ursulin 955b46a33e2STvrtko Ursulin void i915_pmu_register(struct drm_i915_private *i915) 956b46a33e2STvrtko Ursulin { 957b3add01eSTvrtko Ursulin struct intel_engine_cs *engine; 958b3add01eSTvrtko Ursulin enum intel_engine_id id; 959b46a33e2STvrtko Ursulin int ret; 960b46a33e2STvrtko Ursulin 961b46a33e2STvrtko Ursulin if (INTEL_GEN(i915) <= 2) { 962b46a33e2STvrtko Ursulin DRM_INFO("PMU not supported for this GPU."); 963b46a33e2STvrtko Ursulin return; 964b46a33e2STvrtko Ursulin } 965b46a33e2STvrtko Ursulin 966*109ec558STvrtko Ursulin i915_pmu_events_attr_group.attrs = create_event_attributes(i915); 967*109ec558STvrtko Ursulin if (!i915_pmu_events_attr_group.attrs) { 968*109ec558STvrtko Ursulin ret = -ENOMEM; 969*109ec558STvrtko Ursulin goto err; 970*109ec558STvrtko Ursulin } 971*109ec558STvrtko Ursulin 972b46a33e2STvrtko Ursulin i915->pmu.base.attr_groups = i915_pmu_attr_groups; 973b46a33e2STvrtko Ursulin i915->pmu.base.task_ctx_nr = perf_invalid_context; 974b46a33e2STvrtko Ursulin i915->pmu.base.event_init = i915_pmu_event_init; 975b46a33e2STvrtko Ursulin i915->pmu.base.add = i915_pmu_event_add; 976b46a33e2STvrtko Ursulin i915->pmu.base.del = i915_pmu_event_del; 977b46a33e2STvrtko Ursulin i915->pmu.base.start = i915_pmu_event_start; 978b46a33e2STvrtko Ursulin i915->pmu.base.stop = i915_pmu_event_stop; 979b46a33e2STvrtko Ursulin i915->pmu.base.read = i915_pmu_event_read; 980b46a33e2STvrtko Ursulin i915->pmu.base.event_idx = i915_pmu_event_event_idx; 981b46a33e2STvrtko Ursulin 982b46a33e2STvrtko Ursulin spin_lock_init(&i915->pmu.lock); 983b46a33e2STvrtko Ursulin hrtimer_init(&i915->pmu.timer, CLOCK_MONOTONIC, HRTIMER_MODE_REL); 984b46a33e2STvrtko Ursulin i915->pmu.timer.function = i915_sample; 985b46a33e2STvrtko Ursulin 986b3add01eSTvrtko Ursulin for_each_engine(engine, i915, id) 987b3add01eSTvrtko Ursulin INIT_DELAYED_WORK(&engine->pmu.disable_busy_stats, 988b3add01eSTvrtko Ursulin __disable_busy_stats); 989b3add01eSTvrtko Ursulin 990b46a33e2STvrtko Ursulin ret = perf_pmu_register(&i915->pmu.base, "i915", -1); 991b46a33e2STvrtko Ursulin if (ret) 992b46a33e2STvrtko Ursulin goto err; 993b46a33e2STvrtko Ursulin 994b46a33e2STvrtko Ursulin ret = i915_pmu_register_cpuhp_state(i915); 995b46a33e2STvrtko Ursulin if (ret) 996b46a33e2STvrtko Ursulin goto err_unreg; 997b46a33e2STvrtko Ursulin 998b46a33e2STvrtko Ursulin return; 999b46a33e2STvrtko Ursulin 1000b46a33e2STvrtko Ursulin err_unreg: 1001b46a33e2STvrtko Ursulin perf_pmu_unregister(&i915->pmu.base); 1002b46a33e2STvrtko Ursulin err: 1003b46a33e2STvrtko Ursulin i915->pmu.base.event_init = NULL; 1004*109ec558STvrtko Ursulin free_event_attributes(i915); 1005b46a33e2STvrtko Ursulin DRM_NOTE("Failed to register PMU! (err=%d)\n", ret); 1006b46a33e2STvrtko Ursulin } 1007b46a33e2STvrtko Ursulin 1008b46a33e2STvrtko Ursulin void i915_pmu_unregister(struct drm_i915_private *i915) 1009b46a33e2STvrtko Ursulin { 1010b3add01eSTvrtko Ursulin struct intel_engine_cs *engine; 1011b3add01eSTvrtko Ursulin enum intel_engine_id id; 1012b3add01eSTvrtko Ursulin 1013b46a33e2STvrtko Ursulin if (!i915->pmu.base.event_init) 1014b46a33e2STvrtko Ursulin return; 1015b46a33e2STvrtko Ursulin 1016b46a33e2STvrtko Ursulin WARN_ON(i915->pmu.enable); 1017b46a33e2STvrtko Ursulin 1018b46a33e2STvrtko Ursulin hrtimer_cancel(&i915->pmu.timer); 1019b46a33e2STvrtko Ursulin 1020b3add01eSTvrtko Ursulin for_each_engine(engine, i915, id) { 1021b3add01eSTvrtko Ursulin GEM_BUG_ON(engine->pmu.busy_stats); 1022b3add01eSTvrtko Ursulin flush_delayed_work(&engine->pmu.disable_busy_stats); 1023b3add01eSTvrtko Ursulin } 1024b3add01eSTvrtko Ursulin 1025b46a33e2STvrtko Ursulin i915_pmu_unregister_cpuhp_state(i915); 1026b46a33e2STvrtko Ursulin 1027b46a33e2STvrtko Ursulin perf_pmu_unregister(&i915->pmu.base); 1028b46a33e2STvrtko Ursulin i915->pmu.base.event_init = NULL; 1029*109ec558STvrtko Ursulin free_event_attributes(i915); 1030b46a33e2STvrtko Ursulin } 1031