1b46a33e2STvrtko Ursulin /* 2b46a33e2STvrtko Ursulin * Copyright © 2017 Intel Corporation 3b46a33e2STvrtko Ursulin * 4b46a33e2STvrtko Ursulin * Permission is hereby granted, free of charge, to any person obtaining a 5b46a33e2STvrtko Ursulin * copy of this software and associated documentation files (the "Software"), 6b46a33e2STvrtko Ursulin * to deal in the Software without restriction, including without limitation 7b46a33e2STvrtko Ursulin * the rights to use, copy, modify, merge, publish, distribute, sublicense, 8b46a33e2STvrtko Ursulin * and/or sell copies of the Software, and to permit persons to whom the 9b46a33e2STvrtko Ursulin * Software is furnished to do so, subject to the following conditions: 10b46a33e2STvrtko Ursulin * 11b46a33e2STvrtko Ursulin * The above copyright notice and this permission notice (including the next 12b46a33e2STvrtko Ursulin * paragraph) shall be included in all copies or substantial portions of the 13b46a33e2STvrtko Ursulin * Software. 14b46a33e2STvrtko Ursulin * 15b46a33e2STvrtko Ursulin * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 16b46a33e2STvrtko Ursulin * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 17b46a33e2STvrtko Ursulin * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL 18b46a33e2STvrtko Ursulin * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER 19b46a33e2STvrtko Ursulin * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING 20b46a33e2STvrtko Ursulin * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS 21b46a33e2STvrtko Ursulin * IN THE SOFTWARE. 22b46a33e2STvrtko Ursulin * 23b46a33e2STvrtko Ursulin */ 24b46a33e2STvrtko Ursulin 25b46a33e2STvrtko Ursulin #include <linux/perf_event.h> 26b46a33e2STvrtko Ursulin #include <linux/pm_runtime.h> 27b46a33e2STvrtko Ursulin 28b46a33e2STvrtko Ursulin #include "i915_drv.h" 29b46a33e2STvrtko Ursulin #include "i915_pmu.h" 30b46a33e2STvrtko Ursulin #include "intel_ringbuffer.h" 31b46a33e2STvrtko Ursulin 32b46a33e2STvrtko Ursulin /* Frequency for the sampling timer for events which need it. */ 33b46a33e2STvrtko Ursulin #define FREQUENCY 200 34b46a33e2STvrtko Ursulin #define PERIOD max_t(u64, 10000, NSEC_PER_SEC / FREQUENCY) 35b46a33e2STvrtko Ursulin 36b46a33e2STvrtko Ursulin #define ENGINE_SAMPLE_MASK \ 37b46a33e2STvrtko Ursulin (BIT(I915_SAMPLE_BUSY) | \ 38b46a33e2STvrtko Ursulin BIT(I915_SAMPLE_WAIT) | \ 39b46a33e2STvrtko Ursulin BIT(I915_SAMPLE_SEMA)) 40b46a33e2STvrtko Ursulin 41b46a33e2STvrtko Ursulin #define ENGINE_SAMPLE_BITS (1 << I915_PMU_SAMPLE_BITS) 42b46a33e2STvrtko Ursulin 43141a0895SChris Wilson static cpumask_t i915_pmu_cpumask; 44b46a33e2STvrtko Ursulin 45b46a33e2STvrtko Ursulin static u8 engine_config_sample(u64 config) 46b46a33e2STvrtko Ursulin { 47b46a33e2STvrtko Ursulin return config & I915_PMU_SAMPLE_MASK; 48b46a33e2STvrtko Ursulin } 49b46a33e2STvrtko Ursulin 50b46a33e2STvrtko Ursulin static u8 engine_event_sample(struct perf_event *event) 51b46a33e2STvrtko Ursulin { 52b46a33e2STvrtko Ursulin return engine_config_sample(event->attr.config); 53b46a33e2STvrtko Ursulin } 54b46a33e2STvrtko Ursulin 55b46a33e2STvrtko Ursulin static u8 engine_event_class(struct perf_event *event) 56b46a33e2STvrtko Ursulin { 57b46a33e2STvrtko Ursulin return (event->attr.config >> I915_PMU_CLASS_SHIFT) & 0xff; 58b46a33e2STvrtko Ursulin } 59b46a33e2STvrtko Ursulin 60b46a33e2STvrtko Ursulin static u8 engine_event_instance(struct perf_event *event) 61b46a33e2STvrtko Ursulin { 62b46a33e2STvrtko Ursulin return (event->attr.config >> I915_PMU_SAMPLE_BITS) & 0xff; 63b46a33e2STvrtko Ursulin } 64b46a33e2STvrtko Ursulin 65b46a33e2STvrtko Ursulin static bool is_engine_config(u64 config) 66b46a33e2STvrtko Ursulin { 67b46a33e2STvrtko Ursulin return config < __I915_PMU_OTHER(0); 68b46a33e2STvrtko Ursulin } 69b46a33e2STvrtko Ursulin 70b46a33e2STvrtko Ursulin static unsigned int config_enabled_bit(u64 config) 71b46a33e2STvrtko Ursulin { 72b46a33e2STvrtko Ursulin if (is_engine_config(config)) 73b46a33e2STvrtko Ursulin return engine_config_sample(config); 74b46a33e2STvrtko Ursulin else 75b46a33e2STvrtko Ursulin return ENGINE_SAMPLE_BITS + (config - __I915_PMU_OTHER(0)); 76b46a33e2STvrtko Ursulin } 77b46a33e2STvrtko Ursulin 78b46a33e2STvrtko Ursulin static u64 config_enabled_mask(u64 config) 79b46a33e2STvrtko Ursulin { 80b46a33e2STvrtko Ursulin return BIT_ULL(config_enabled_bit(config)); 81b46a33e2STvrtko Ursulin } 82b46a33e2STvrtko Ursulin 83b46a33e2STvrtko Ursulin static bool is_engine_event(struct perf_event *event) 84b46a33e2STvrtko Ursulin { 85b46a33e2STvrtko Ursulin return is_engine_config(event->attr.config); 86b46a33e2STvrtko Ursulin } 87b46a33e2STvrtko Ursulin 88b46a33e2STvrtko Ursulin static unsigned int event_enabled_bit(struct perf_event *event) 89b46a33e2STvrtko Ursulin { 90b46a33e2STvrtko Ursulin return config_enabled_bit(event->attr.config); 91b46a33e2STvrtko Ursulin } 92b46a33e2STvrtko Ursulin 93feff0dc6STvrtko Ursulin static bool pmu_needs_timer(struct drm_i915_private *i915, bool gpu_active) 94feff0dc6STvrtko Ursulin { 95feff0dc6STvrtko Ursulin u64 enable; 96feff0dc6STvrtko Ursulin 97feff0dc6STvrtko Ursulin /* 98feff0dc6STvrtko Ursulin * Only some counters need the sampling timer. 99feff0dc6STvrtko Ursulin * 100feff0dc6STvrtko Ursulin * We start with a bitmask of all currently enabled events. 101feff0dc6STvrtko Ursulin */ 102feff0dc6STvrtko Ursulin enable = i915->pmu.enable; 103feff0dc6STvrtko Ursulin 104feff0dc6STvrtko Ursulin /* 105feff0dc6STvrtko Ursulin * Mask out all the ones which do not need the timer, or in 106feff0dc6STvrtko Ursulin * other words keep all the ones that could need the timer. 107feff0dc6STvrtko Ursulin */ 108feff0dc6STvrtko Ursulin enable &= config_enabled_mask(I915_PMU_ACTUAL_FREQUENCY) | 109feff0dc6STvrtko Ursulin config_enabled_mask(I915_PMU_REQUESTED_FREQUENCY) | 110feff0dc6STvrtko Ursulin ENGINE_SAMPLE_MASK; 111feff0dc6STvrtko Ursulin 112feff0dc6STvrtko Ursulin /* 113feff0dc6STvrtko Ursulin * When the GPU is idle per-engine counters do not need to be 114feff0dc6STvrtko Ursulin * running so clear those bits out. 115feff0dc6STvrtko Ursulin */ 116feff0dc6STvrtko Ursulin if (!gpu_active) 117feff0dc6STvrtko Ursulin enable &= ~ENGINE_SAMPLE_MASK; 118b3add01eSTvrtko Ursulin /* 119b3add01eSTvrtko Ursulin * Also there is software busyness tracking available we do not 120b3add01eSTvrtko Ursulin * need the timer for I915_SAMPLE_BUSY counter. 121cf669b4eSTvrtko Ursulin * 122cf669b4eSTvrtko Ursulin * Use RCS as proxy for all engines. 123b3add01eSTvrtko Ursulin */ 124cf669b4eSTvrtko Ursulin else if (intel_engine_supports_stats(i915->engine[RCS])) 125b3add01eSTvrtko Ursulin enable &= ~BIT(I915_SAMPLE_BUSY); 126feff0dc6STvrtko Ursulin 127feff0dc6STvrtko Ursulin /* 128feff0dc6STvrtko Ursulin * If some bits remain it means we need the sampling timer running. 129feff0dc6STvrtko Ursulin */ 130feff0dc6STvrtko Ursulin return enable; 131feff0dc6STvrtko Ursulin } 132feff0dc6STvrtko Ursulin 133feff0dc6STvrtko Ursulin void i915_pmu_gt_parked(struct drm_i915_private *i915) 134feff0dc6STvrtko Ursulin { 135feff0dc6STvrtko Ursulin if (!i915->pmu.base.event_init) 136feff0dc6STvrtko Ursulin return; 137feff0dc6STvrtko Ursulin 138feff0dc6STvrtko Ursulin spin_lock_irq(&i915->pmu.lock); 139feff0dc6STvrtko Ursulin /* 140feff0dc6STvrtko Ursulin * Signal sampling timer to stop if only engine events are enabled and 141feff0dc6STvrtko Ursulin * GPU went idle. 142feff0dc6STvrtko Ursulin */ 143feff0dc6STvrtko Ursulin i915->pmu.timer_enabled = pmu_needs_timer(i915, false); 144feff0dc6STvrtko Ursulin spin_unlock_irq(&i915->pmu.lock); 145feff0dc6STvrtko Ursulin } 146feff0dc6STvrtko Ursulin 147feff0dc6STvrtko Ursulin static void __i915_pmu_maybe_start_timer(struct drm_i915_private *i915) 148feff0dc6STvrtko Ursulin { 149feff0dc6STvrtko Ursulin if (!i915->pmu.timer_enabled && pmu_needs_timer(i915, true)) { 150feff0dc6STvrtko Ursulin i915->pmu.timer_enabled = true; 151feff0dc6STvrtko Ursulin hrtimer_start_range_ns(&i915->pmu.timer, 152feff0dc6STvrtko Ursulin ns_to_ktime(PERIOD), 0, 153feff0dc6STvrtko Ursulin HRTIMER_MODE_REL_PINNED); 154feff0dc6STvrtko Ursulin } 155feff0dc6STvrtko Ursulin } 156feff0dc6STvrtko Ursulin 157feff0dc6STvrtko Ursulin void i915_pmu_gt_unparked(struct drm_i915_private *i915) 158feff0dc6STvrtko Ursulin { 159feff0dc6STvrtko Ursulin if (!i915->pmu.base.event_init) 160feff0dc6STvrtko Ursulin return; 161feff0dc6STvrtko Ursulin 162feff0dc6STvrtko Ursulin spin_lock_irq(&i915->pmu.lock); 163feff0dc6STvrtko Ursulin /* 164feff0dc6STvrtko Ursulin * Re-enable sampling timer when GPU goes active. 165feff0dc6STvrtko Ursulin */ 166feff0dc6STvrtko Ursulin __i915_pmu_maybe_start_timer(i915); 167feff0dc6STvrtko Ursulin spin_unlock_irq(&i915->pmu.lock); 168feff0dc6STvrtko Ursulin } 169feff0dc6STvrtko Ursulin 170b46a33e2STvrtko Ursulin static bool grab_forcewake(struct drm_i915_private *i915, bool fw) 171b46a33e2STvrtko Ursulin { 172b46a33e2STvrtko Ursulin if (!fw) 173b46a33e2STvrtko Ursulin intel_uncore_forcewake_get(i915, FORCEWAKE_ALL); 174b46a33e2STvrtko Ursulin 175b46a33e2STvrtko Ursulin return true; 176b46a33e2STvrtko Ursulin } 177b46a33e2STvrtko Ursulin 178b46a33e2STvrtko Ursulin static void 179b46a33e2STvrtko Ursulin update_sample(struct i915_pmu_sample *sample, u32 unit, u32 val) 180b46a33e2STvrtko Ursulin { 1818ee4f19cSTvrtko Ursulin sample->cur += mul_u32_u32(val, unit); 182b46a33e2STvrtko Ursulin } 183b46a33e2STvrtko Ursulin 184b46a33e2STvrtko Ursulin static void engines_sample(struct drm_i915_private *dev_priv) 185b46a33e2STvrtko Ursulin { 186b46a33e2STvrtko Ursulin struct intel_engine_cs *engine; 187b46a33e2STvrtko Ursulin enum intel_engine_id id; 188b46a33e2STvrtko Ursulin bool fw = false; 189b46a33e2STvrtko Ursulin 190b46a33e2STvrtko Ursulin if ((dev_priv->pmu.enable & ENGINE_SAMPLE_MASK) == 0) 191b46a33e2STvrtko Ursulin return; 192b46a33e2STvrtko Ursulin 193b46a33e2STvrtko Ursulin if (!dev_priv->gt.awake) 194b46a33e2STvrtko Ursulin return; 195b46a33e2STvrtko Ursulin 196b46a33e2STvrtko Ursulin if (!intel_runtime_pm_get_if_in_use(dev_priv)) 197b46a33e2STvrtko Ursulin return; 198b46a33e2STvrtko Ursulin 199b46a33e2STvrtko Ursulin for_each_engine(engine, dev_priv, id) { 200b46a33e2STvrtko Ursulin u32 current_seqno = intel_engine_get_seqno(engine); 201b46a33e2STvrtko Ursulin u32 last_seqno = intel_engine_last_submit(engine); 202b46a33e2STvrtko Ursulin u32 val; 203b46a33e2STvrtko Ursulin 204b46a33e2STvrtko Ursulin val = !i915_seqno_passed(current_seqno, last_seqno); 205b46a33e2STvrtko Ursulin 206b46a33e2STvrtko Ursulin update_sample(&engine->pmu.sample[I915_SAMPLE_BUSY], 207b46a33e2STvrtko Ursulin PERIOD, val); 208b46a33e2STvrtko Ursulin 209b46a33e2STvrtko Ursulin if (val && (engine->pmu.enable & 210b46a33e2STvrtko Ursulin (BIT(I915_SAMPLE_WAIT) | BIT(I915_SAMPLE_SEMA)))) { 211b46a33e2STvrtko Ursulin fw = grab_forcewake(dev_priv, fw); 212b46a33e2STvrtko Ursulin 213b46a33e2STvrtko Ursulin val = I915_READ_FW(RING_CTL(engine->mmio_base)); 214b46a33e2STvrtko Ursulin } else { 215b46a33e2STvrtko Ursulin val = 0; 216b46a33e2STvrtko Ursulin } 217b46a33e2STvrtko Ursulin 218b46a33e2STvrtko Ursulin update_sample(&engine->pmu.sample[I915_SAMPLE_WAIT], 219b46a33e2STvrtko Ursulin PERIOD, !!(val & RING_WAIT)); 220b46a33e2STvrtko Ursulin 221b46a33e2STvrtko Ursulin update_sample(&engine->pmu.sample[I915_SAMPLE_SEMA], 222b46a33e2STvrtko Ursulin PERIOD, !!(val & RING_WAIT_SEMAPHORE)); 223b46a33e2STvrtko Ursulin } 224b46a33e2STvrtko Ursulin 225b46a33e2STvrtko Ursulin if (fw) 226b46a33e2STvrtko Ursulin intel_uncore_forcewake_put(dev_priv, FORCEWAKE_ALL); 227b46a33e2STvrtko Ursulin 228b46a33e2STvrtko Ursulin intel_runtime_pm_put(dev_priv); 229b46a33e2STvrtko Ursulin } 230b46a33e2STvrtko Ursulin 231b46a33e2STvrtko Ursulin static void frequency_sample(struct drm_i915_private *dev_priv) 232b46a33e2STvrtko Ursulin { 233b46a33e2STvrtko Ursulin if (dev_priv->pmu.enable & 234b46a33e2STvrtko Ursulin config_enabled_mask(I915_PMU_ACTUAL_FREQUENCY)) { 235b46a33e2STvrtko Ursulin u32 val; 236b46a33e2STvrtko Ursulin 237b46a33e2STvrtko Ursulin val = dev_priv->gt_pm.rps.cur_freq; 238b46a33e2STvrtko Ursulin if (dev_priv->gt.awake && 239b46a33e2STvrtko Ursulin intel_runtime_pm_get_if_in_use(dev_priv)) { 240b46a33e2STvrtko Ursulin val = intel_get_cagf(dev_priv, 241b46a33e2STvrtko Ursulin I915_READ_NOTRACE(GEN6_RPSTAT1)); 242b46a33e2STvrtko Ursulin intel_runtime_pm_put(dev_priv); 243b46a33e2STvrtko Ursulin } 244b46a33e2STvrtko Ursulin 245b46a33e2STvrtko Ursulin update_sample(&dev_priv->pmu.sample[__I915_SAMPLE_FREQ_ACT], 246b46a33e2STvrtko Ursulin 1, intel_gpu_freq(dev_priv, val)); 247b46a33e2STvrtko Ursulin } 248b46a33e2STvrtko Ursulin 249b46a33e2STvrtko Ursulin if (dev_priv->pmu.enable & 250b46a33e2STvrtko Ursulin config_enabled_mask(I915_PMU_REQUESTED_FREQUENCY)) { 251b46a33e2STvrtko Ursulin update_sample(&dev_priv->pmu.sample[__I915_SAMPLE_FREQ_REQ], 1, 252b46a33e2STvrtko Ursulin intel_gpu_freq(dev_priv, 253b46a33e2STvrtko Ursulin dev_priv->gt_pm.rps.cur_freq)); 254b46a33e2STvrtko Ursulin } 255b46a33e2STvrtko Ursulin } 256b46a33e2STvrtko Ursulin 257b46a33e2STvrtko Ursulin static enum hrtimer_restart i915_sample(struct hrtimer *hrtimer) 258b46a33e2STvrtko Ursulin { 259b46a33e2STvrtko Ursulin struct drm_i915_private *i915 = 260b46a33e2STvrtko Ursulin container_of(hrtimer, struct drm_i915_private, pmu.timer); 261b46a33e2STvrtko Ursulin 2628ee4f19cSTvrtko Ursulin if (!READ_ONCE(i915->pmu.timer_enabled)) 263b46a33e2STvrtko Ursulin return HRTIMER_NORESTART; 264b46a33e2STvrtko Ursulin 265b46a33e2STvrtko Ursulin engines_sample(i915); 266b46a33e2STvrtko Ursulin frequency_sample(i915); 267b46a33e2STvrtko Ursulin 268b46a33e2STvrtko Ursulin hrtimer_forward_now(hrtimer, ns_to_ktime(PERIOD)); 269b46a33e2STvrtko Ursulin return HRTIMER_RESTART; 270b46a33e2STvrtko Ursulin } 271b46a33e2STvrtko Ursulin 2720cd4684dSTvrtko Ursulin static u64 count_interrupts(struct drm_i915_private *i915) 2730cd4684dSTvrtko Ursulin { 2740cd4684dSTvrtko Ursulin /* open-coded kstat_irqs() */ 2750cd4684dSTvrtko Ursulin struct irq_desc *desc = irq_to_desc(i915->drm.pdev->irq); 2760cd4684dSTvrtko Ursulin u64 sum = 0; 2770cd4684dSTvrtko Ursulin int cpu; 2780cd4684dSTvrtko Ursulin 2790cd4684dSTvrtko Ursulin if (!desc || !desc->kstat_irqs) 2800cd4684dSTvrtko Ursulin return 0; 2810cd4684dSTvrtko Ursulin 2820cd4684dSTvrtko Ursulin for_each_possible_cpu(cpu) 2830cd4684dSTvrtko Ursulin sum += *per_cpu_ptr(desc->kstat_irqs, cpu); 2840cd4684dSTvrtko Ursulin 2850cd4684dSTvrtko Ursulin return sum; 2860cd4684dSTvrtko Ursulin } 2870cd4684dSTvrtko Ursulin 288b46a33e2STvrtko Ursulin static void i915_pmu_event_destroy(struct perf_event *event) 289b46a33e2STvrtko Ursulin { 290b46a33e2STvrtko Ursulin WARN_ON(event->parent); 291b46a33e2STvrtko Ursulin } 292b46a33e2STvrtko Ursulin 293109ec558STvrtko Ursulin static int 294109ec558STvrtko Ursulin engine_event_status(struct intel_engine_cs *engine, 295109ec558STvrtko Ursulin enum drm_i915_pmu_engine_sample sample) 296b46a33e2STvrtko Ursulin { 297109ec558STvrtko Ursulin switch (sample) { 298b46a33e2STvrtko Ursulin case I915_SAMPLE_BUSY: 299b46a33e2STvrtko Ursulin case I915_SAMPLE_WAIT: 300b46a33e2STvrtko Ursulin break; 301b46a33e2STvrtko Ursulin case I915_SAMPLE_SEMA: 302109ec558STvrtko Ursulin if (INTEL_GEN(engine->i915) < 6) 303b46a33e2STvrtko Ursulin return -ENODEV; 304b46a33e2STvrtko Ursulin break; 305b46a33e2STvrtko Ursulin default: 306b46a33e2STvrtko Ursulin return -ENOENT; 307b46a33e2STvrtko Ursulin } 308b46a33e2STvrtko Ursulin 309b46a33e2STvrtko Ursulin return 0; 310b46a33e2STvrtko Ursulin } 311b46a33e2STvrtko Ursulin 312109ec558STvrtko Ursulin static int 313109ec558STvrtko Ursulin config_status(struct drm_i915_private *i915, u64 config) 314109ec558STvrtko Ursulin { 315109ec558STvrtko Ursulin switch (config) { 316109ec558STvrtko Ursulin case I915_PMU_ACTUAL_FREQUENCY: 317109ec558STvrtko Ursulin if (IS_VALLEYVIEW(i915) || IS_CHERRYVIEW(i915)) 318109ec558STvrtko Ursulin /* Requires a mutex for sampling! */ 319109ec558STvrtko Ursulin return -ENODEV; 320109ec558STvrtko Ursulin /* Fall-through. */ 321109ec558STvrtko Ursulin case I915_PMU_REQUESTED_FREQUENCY: 322109ec558STvrtko Ursulin if (INTEL_GEN(i915) < 6) 323109ec558STvrtko Ursulin return -ENODEV; 324109ec558STvrtko Ursulin break; 325109ec558STvrtko Ursulin case I915_PMU_INTERRUPTS: 326109ec558STvrtko Ursulin break; 327109ec558STvrtko Ursulin case I915_PMU_RC6_RESIDENCY: 328109ec558STvrtko Ursulin if (!HAS_RC6(i915)) 329109ec558STvrtko Ursulin return -ENODEV; 330109ec558STvrtko Ursulin break; 331109ec558STvrtko Ursulin default: 332109ec558STvrtko Ursulin return -ENOENT; 333109ec558STvrtko Ursulin } 334109ec558STvrtko Ursulin 335109ec558STvrtko Ursulin return 0; 336109ec558STvrtko Ursulin } 337109ec558STvrtko Ursulin 338109ec558STvrtko Ursulin static int engine_event_init(struct perf_event *event) 339109ec558STvrtko Ursulin { 340109ec558STvrtko Ursulin struct drm_i915_private *i915 = 341109ec558STvrtko Ursulin container_of(event->pmu, typeof(*i915), pmu.base); 342109ec558STvrtko Ursulin struct intel_engine_cs *engine; 343109ec558STvrtko Ursulin 344109ec558STvrtko Ursulin engine = intel_engine_lookup_user(i915, engine_event_class(event), 345109ec558STvrtko Ursulin engine_event_instance(event)); 346109ec558STvrtko Ursulin if (!engine) 347109ec558STvrtko Ursulin return -ENODEV; 348109ec558STvrtko Ursulin 349109ec558STvrtko Ursulin return engine_event_status(engine, engine_event_sample(event)); 350109ec558STvrtko Ursulin } 351109ec558STvrtko Ursulin 352b46a33e2STvrtko Ursulin static int i915_pmu_event_init(struct perf_event *event) 353b46a33e2STvrtko Ursulin { 354b46a33e2STvrtko Ursulin struct drm_i915_private *i915 = 355b46a33e2STvrtko Ursulin container_of(event->pmu, typeof(*i915), pmu.base); 3560426c046STvrtko Ursulin int ret; 357b46a33e2STvrtko Ursulin 358b46a33e2STvrtko Ursulin if (event->attr.type != event->pmu->type) 359b46a33e2STvrtko Ursulin return -ENOENT; 360b46a33e2STvrtko Ursulin 361b46a33e2STvrtko Ursulin /* unsupported modes and filters */ 362b46a33e2STvrtko Ursulin if (event->attr.sample_period) /* no sampling */ 363b46a33e2STvrtko Ursulin return -EINVAL; 364b46a33e2STvrtko Ursulin 365b46a33e2STvrtko Ursulin if (has_branch_stack(event)) 366b46a33e2STvrtko Ursulin return -EOPNOTSUPP; 367b46a33e2STvrtko Ursulin 368b46a33e2STvrtko Ursulin if (event->cpu < 0) 369b46a33e2STvrtko Ursulin return -EINVAL; 370b46a33e2STvrtko Ursulin 3710426c046STvrtko Ursulin /* only allow running on one cpu at a time */ 3720426c046STvrtko Ursulin if (!cpumask_test_cpu(event->cpu, &i915_pmu_cpumask)) 37300a79722STvrtko Ursulin return -EINVAL; 374b46a33e2STvrtko Ursulin 375109ec558STvrtko Ursulin if (is_engine_event(event)) 376b46a33e2STvrtko Ursulin ret = engine_event_init(event); 377109ec558STvrtko Ursulin else 378109ec558STvrtko Ursulin ret = config_status(i915, event->attr.config); 379b46a33e2STvrtko Ursulin if (ret) 380b46a33e2STvrtko Ursulin return ret; 381b46a33e2STvrtko Ursulin 382b46a33e2STvrtko Ursulin if (!event->parent) 383b46a33e2STvrtko Ursulin event->destroy = i915_pmu_event_destroy; 384b46a33e2STvrtko Ursulin 385b46a33e2STvrtko Ursulin return 0; 386b46a33e2STvrtko Ursulin } 387b46a33e2STvrtko Ursulin 388b46a33e2STvrtko Ursulin static u64 __i915_pmu_event_read(struct perf_event *event) 389b46a33e2STvrtko Ursulin { 390b46a33e2STvrtko Ursulin struct drm_i915_private *i915 = 391b46a33e2STvrtko Ursulin container_of(event->pmu, typeof(*i915), pmu.base); 392b46a33e2STvrtko Ursulin u64 val = 0; 393b46a33e2STvrtko Ursulin 394b46a33e2STvrtko Ursulin if (is_engine_event(event)) { 395b46a33e2STvrtko Ursulin u8 sample = engine_event_sample(event); 396b46a33e2STvrtko Ursulin struct intel_engine_cs *engine; 397b46a33e2STvrtko Ursulin 398b46a33e2STvrtko Ursulin engine = intel_engine_lookup_user(i915, 399b46a33e2STvrtko Ursulin engine_event_class(event), 400b46a33e2STvrtko Ursulin engine_event_instance(event)); 401b46a33e2STvrtko Ursulin 402b46a33e2STvrtko Ursulin if (WARN_ON_ONCE(!engine)) { 403b46a33e2STvrtko Ursulin /* Do nothing */ 404b3add01eSTvrtko Ursulin } else if (sample == I915_SAMPLE_BUSY && 405b3add01eSTvrtko Ursulin engine->pmu.busy_stats) { 406b3add01eSTvrtko Ursulin val = ktime_to_ns(intel_engine_get_busy_time(engine)); 407b46a33e2STvrtko Ursulin } else { 408b46a33e2STvrtko Ursulin val = engine->pmu.sample[sample].cur; 409b46a33e2STvrtko Ursulin } 410b46a33e2STvrtko Ursulin } else { 411b46a33e2STvrtko Ursulin switch (event->attr.config) { 412b46a33e2STvrtko Ursulin case I915_PMU_ACTUAL_FREQUENCY: 413b46a33e2STvrtko Ursulin val = 414b46a33e2STvrtko Ursulin div_u64(i915->pmu.sample[__I915_SAMPLE_FREQ_ACT].cur, 415b46a33e2STvrtko Ursulin FREQUENCY); 416b46a33e2STvrtko Ursulin break; 417b46a33e2STvrtko Ursulin case I915_PMU_REQUESTED_FREQUENCY: 418b46a33e2STvrtko Ursulin val = 419b46a33e2STvrtko Ursulin div_u64(i915->pmu.sample[__I915_SAMPLE_FREQ_REQ].cur, 420b46a33e2STvrtko Ursulin FREQUENCY); 421b46a33e2STvrtko Ursulin break; 4220cd4684dSTvrtko Ursulin case I915_PMU_INTERRUPTS: 4230cd4684dSTvrtko Ursulin val = count_interrupts(i915); 4240cd4684dSTvrtko Ursulin break; 4256060b6aeSTvrtko Ursulin case I915_PMU_RC6_RESIDENCY: 4266060b6aeSTvrtko Ursulin intel_runtime_pm_get(i915); 4276060b6aeSTvrtko Ursulin val = intel_rc6_residency_ns(i915, 4286060b6aeSTvrtko Ursulin IS_VALLEYVIEW(i915) ? 4296060b6aeSTvrtko Ursulin VLV_GT_RENDER_RC6 : 4306060b6aeSTvrtko Ursulin GEN6_GT_GFX_RC6); 431fb6db0f5SChris Wilson if (HAS_RC6p(i915)) 4323452fa30STvrtko Ursulin val += intel_rc6_residency_ns(i915, 4333452fa30STvrtko Ursulin GEN6_GT_GFX_RC6p); 434fb6db0f5SChris Wilson if (HAS_RC6pp(i915)) 4353452fa30STvrtko Ursulin val += intel_rc6_residency_ns(i915, 4363452fa30STvrtko Ursulin GEN6_GT_GFX_RC6pp); 4376060b6aeSTvrtko Ursulin intel_runtime_pm_put(i915); 4386060b6aeSTvrtko Ursulin break; 439b46a33e2STvrtko Ursulin } 440b46a33e2STvrtko Ursulin } 441b46a33e2STvrtko Ursulin 442b46a33e2STvrtko Ursulin return val; 443b46a33e2STvrtko Ursulin } 444b46a33e2STvrtko Ursulin 445b46a33e2STvrtko Ursulin static void i915_pmu_event_read(struct perf_event *event) 446b46a33e2STvrtko Ursulin { 447b46a33e2STvrtko Ursulin struct hw_perf_event *hwc = &event->hw; 448b46a33e2STvrtko Ursulin u64 prev, new; 449b46a33e2STvrtko Ursulin 450b46a33e2STvrtko Ursulin again: 451b46a33e2STvrtko Ursulin prev = local64_read(&hwc->prev_count); 452b46a33e2STvrtko Ursulin new = __i915_pmu_event_read(event); 453b46a33e2STvrtko Ursulin 454b46a33e2STvrtko Ursulin if (local64_cmpxchg(&hwc->prev_count, prev, new) != prev) 455b46a33e2STvrtko Ursulin goto again; 456b46a33e2STvrtko Ursulin 457b46a33e2STvrtko Ursulin local64_add(new - prev, &event->count); 458b46a33e2STvrtko Ursulin } 459b46a33e2STvrtko Ursulin 460b3add01eSTvrtko Ursulin static bool engine_needs_busy_stats(struct intel_engine_cs *engine) 461b3add01eSTvrtko Ursulin { 462cf669b4eSTvrtko Ursulin return intel_engine_supports_stats(engine) && 463b3add01eSTvrtko Ursulin (engine->pmu.enable & BIT(I915_SAMPLE_BUSY)); 464b3add01eSTvrtko Ursulin } 465b3add01eSTvrtko Ursulin 466b46a33e2STvrtko Ursulin static void i915_pmu_enable(struct perf_event *event) 467b46a33e2STvrtko Ursulin { 468b46a33e2STvrtko Ursulin struct drm_i915_private *i915 = 469b46a33e2STvrtko Ursulin container_of(event->pmu, typeof(*i915), pmu.base); 470b46a33e2STvrtko Ursulin unsigned int bit = event_enabled_bit(event); 471b46a33e2STvrtko Ursulin unsigned long flags; 472b46a33e2STvrtko Ursulin 473b46a33e2STvrtko Ursulin spin_lock_irqsave(&i915->pmu.lock, flags); 474b46a33e2STvrtko Ursulin 475b46a33e2STvrtko Ursulin /* 476b46a33e2STvrtko Ursulin * Update the bitmask of enabled events and increment 477b46a33e2STvrtko Ursulin * the event reference counter. 478b46a33e2STvrtko Ursulin */ 479b46a33e2STvrtko Ursulin GEM_BUG_ON(bit >= I915_PMU_MASK_BITS); 480b46a33e2STvrtko Ursulin GEM_BUG_ON(i915->pmu.enable_count[bit] == ~0); 481b46a33e2STvrtko Ursulin i915->pmu.enable |= BIT_ULL(bit); 482b46a33e2STvrtko Ursulin i915->pmu.enable_count[bit]++; 483b46a33e2STvrtko Ursulin 484b46a33e2STvrtko Ursulin /* 485feff0dc6STvrtko Ursulin * Start the sampling timer if needed and not already enabled. 486feff0dc6STvrtko Ursulin */ 487feff0dc6STvrtko Ursulin __i915_pmu_maybe_start_timer(i915); 488feff0dc6STvrtko Ursulin 489feff0dc6STvrtko Ursulin /* 490b46a33e2STvrtko Ursulin * For per-engine events the bitmask and reference counting 491b46a33e2STvrtko Ursulin * is stored per engine. 492b46a33e2STvrtko Ursulin */ 493b46a33e2STvrtko Ursulin if (is_engine_event(event)) { 494b46a33e2STvrtko Ursulin u8 sample = engine_event_sample(event); 495b46a33e2STvrtko Ursulin struct intel_engine_cs *engine; 496b46a33e2STvrtko Ursulin 497b46a33e2STvrtko Ursulin engine = intel_engine_lookup_user(i915, 498b46a33e2STvrtko Ursulin engine_event_class(event), 499b46a33e2STvrtko Ursulin engine_event_instance(event)); 500b46a33e2STvrtko Ursulin GEM_BUG_ON(!engine); 501b46a33e2STvrtko Ursulin engine->pmu.enable |= BIT(sample); 502b46a33e2STvrtko Ursulin 503b46a33e2STvrtko Ursulin GEM_BUG_ON(sample >= I915_PMU_SAMPLE_BITS); 504b46a33e2STvrtko Ursulin GEM_BUG_ON(engine->pmu.enable_count[sample] == ~0); 505b3add01eSTvrtko Ursulin if (engine->pmu.enable_count[sample]++ == 0) { 506b3add01eSTvrtko Ursulin /* 507b3add01eSTvrtko Ursulin * Enable engine busy stats tracking if needed or 508b3add01eSTvrtko Ursulin * alternatively cancel the scheduled disable. 509b3add01eSTvrtko Ursulin * 510b3add01eSTvrtko Ursulin * If the delayed disable was pending, cancel it and 511b3add01eSTvrtko Ursulin * in this case do not enable since it already is. 512b3add01eSTvrtko Ursulin */ 513b3add01eSTvrtko Ursulin if (engine_needs_busy_stats(engine) && 514b3add01eSTvrtko Ursulin !engine->pmu.busy_stats) { 515b3add01eSTvrtko Ursulin engine->pmu.busy_stats = true; 516b3add01eSTvrtko Ursulin if (!cancel_delayed_work(&engine->pmu.disable_busy_stats)) 517b3add01eSTvrtko Ursulin intel_enable_engine_stats(engine); 518b3add01eSTvrtko Ursulin } 519b3add01eSTvrtko Ursulin } 520b46a33e2STvrtko Ursulin } 521b46a33e2STvrtko Ursulin 522b46a33e2STvrtko Ursulin /* 523b46a33e2STvrtko Ursulin * Store the current counter value so we can report the correct delta 524b46a33e2STvrtko Ursulin * for all listeners. Even when the event was already enabled and has 525b46a33e2STvrtko Ursulin * an existing non-zero value. 526b46a33e2STvrtko Ursulin */ 527b46a33e2STvrtko Ursulin local64_set(&event->hw.prev_count, __i915_pmu_event_read(event)); 528b46a33e2STvrtko Ursulin 529b46a33e2STvrtko Ursulin spin_unlock_irqrestore(&i915->pmu.lock, flags); 530b46a33e2STvrtko Ursulin } 531b46a33e2STvrtko Ursulin 532b3add01eSTvrtko Ursulin static void __disable_busy_stats(struct work_struct *work) 533b3add01eSTvrtko Ursulin { 534b3add01eSTvrtko Ursulin struct intel_engine_cs *engine = 535b3add01eSTvrtko Ursulin container_of(work, typeof(*engine), pmu.disable_busy_stats.work); 536b3add01eSTvrtko Ursulin 537b3add01eSTvrtko Ursulin intel_disable_engine_stats(engine); 538b3add01eSTvrtko Ursulin } 539b3add01eSTvrtko Ursulin 540b46a33e2STvrtko Ursulin static void i915_pmu_disable(struct perf_event *event) 541b46a33e2STvrtko Ursulin { 542b46a33e2STvrtko Ursulin struct drm_i915_private *i915 = 543b46a33e2STvrtko Ursulin container_of(event->pmu, typeof(*i915), pmu.base); 544b46a33e2STvrtko Ursulin unsigned int bit = event_enabled_bit(event); 545b46a33e2STvrtko Ursulin unsigned long flags; 546b46a33e2STvrtko Ursulin 547b46a33e2STvrtko Ursulin spin_lock_irqsave(&i915->pmu.lock, flags); 548b46a33e2STvrtko Ursulin 549b46a33e2STvrtko Ursulin if (is_engine_event(event)) { 550b46a33e2STvrtko Ursulin u8 sample = engine_event_sample(event); 551b46a33e2STvrtko Ursulin struct intel_engine_cs *engine; 552b46a33e2STvrtko Ursulin 553b46a33e2STvrtko Ursulin engine = intel_engine_lookup_user(i915, 554b46a33e2STvrtko Ursulin engine_event_class(event), 555b46a33e2STvrtko Ursulin engine_event_instance(event)); 556b46a33e2STvrtko Ursulin GEM_BUG_ON(!engine); 557b46a33e2STvrtko Ursulin GEM_BUG_ON(sample >= I915_PMU_SAMPLE_BITS); 558b46a33e2STvrtko Ursulin GEM_BUG_ON(engine->pmu.enable_count[sample] == 0); 559b46a33e2STvrtko Ursulin /* 560b46a33e2STvrtko Ursulin * Decrement the reference count and clear the enabled 561b46a33e2STvrtko Ursulin * bitmask when the last listener on an event goes away. 562b46a33e2STvrtko Ursulin */ 563b3add01eSTvrtko Ursulin if (--engine->pmu.enable_count[sample] == 0) { 564b46a33e2STvrtko Ursulin engine->pmu.enable &= ~BIT(sample); 565b3add01eSTvrtko Ursulin if (!engine_needs_busy_stats(engine) && 566b3add01eSTvrtko Ursulin engine->pmu.busy_stats) { 567b3add01eSTvrtko Ursulin engine->pmu.busy_stats = false; 568b3add01eSTvrtko Ursulin /* 569b3add01eSTvrtko Ursulin * We request a delayed disable to handle the 570b3add01eSTvrtko Ursulin * rapid on/off cycles on events, which can 571b3add01eSTvrtko Ursulin * happen when tools like perf stat start, in a 572b3add01eSTvrtko Ursulin * nicer way. 573b3add01eSTvrtko Ursulin * 574b3add01eSTvrtko Ursulin * In addition, this also helps with busy stats 575b3add01eSTvrtko Ursulin * accuracy with background CPU offline/online 576b3add01eSTvrtko Ursulin * migration events. 577b3add01eSTvrtko Ursulin */ 578b3add01eSTvrtko Ursulin queue_delayed_work(system_wq, 579b3add01eSTvrtko Ursulin &engine->pmu.disable_busy_stats, 580b3add01eSTvrtko Ursulin round_jiffies_up_relative(HZ)); 581b3add01eSTvrtko Ursulin } 582b3add01eSTvrtko Ursulin } 583b46a33e2STvrtko Ursulin } 584b46a33e2STvrtko Ursulin 585b46a33e2STvrtko Ursulin GEM_BUG_ON(bit >= I915_PMU_MASK_BITS); 586b46a33e2STvrtko Ursulin GEM_BUG_ON(i915->pmu.enable_count[bit] == 0); 587b46a33e2STvrtko Ursulin /* 588b46a33e2STvrtko Ursulin * Decrement the reference count and clear the enabled 589b46a33e2STvrtko Ursulin * bitmask when the last listener on an event goes away. 590b46a33e2STvrtko Ursulin */ 591feff0dc6STvrtko Ursulin if (--i915->pmu.enable_count[bit] == 0) { 592b46a33e2STvrtko Ursulin i915->pmu.enable &= ~BIT_ULL(bit); 593feff0dc6STvrtko Ursulin i915->pmu.timer_enabled &= pmu_needs_timer(i915, true); 594feff0dc6STvrtko Ursulin } 595b46a33e2STvrtko Ursulin 596b46a33e2STvrtko Ursulin spin_unlock_irqrestore(&i915->pmu.lock, flags); 597b46a33e2STvrtko Ursulin } 598b46a33e2STvrtko Ursulin 599b46a33e2STvrtko Ursulin static void i915_pmu_event_start(struct perf_event *event, int flags) 600b46a33e2STvrtko Ursulin { 601b46a33e2STvrtko Ursulin i915_pmu_enable(event); 602b46a33e2STvrtko Ursulin event->hw.state = 0; 603b46a33e2STvrtko Ursulin } 604b46a33e2STvrtko Ursulin 605b46a33e2STvrtko Ursulin static void i915_pmu_event_stop(struct perf_event *event, int flags) 606b46a33e2STvrtko Ursulin { 607b46a33e2STvrtko Ursulin if (flags & PERF_EF_UPDATE) 608b46a33e2STvrtko Ursulin i915_pmu_event_read(event); 609b46a33e2STvrtko Ursulin i915_pmu_disable(event); 610b46a33e2STvrtko Ursulin event->hw.state = PERF_HES_STOPPED; 611b46a33e2STvrtko Ursulin } 612b46a33e2STvrtko Ursulin 613b46a33e2STvrtko Ursulin static int i915_pmu_event_add(struct perf_event *event, int flags) 614b46a33e2STvrtko Ursulin { 615b46a33e2STvrtko Ursulin if (flags & PERF_EF_START) 616b46a33e2STvrtko Ursulin i915_pmu_event_start(event, flags); 617b46a33e2STvrtko Ursulin 618b46a33e2STvrtko Ursulin return 0; 619b46a33e2STvrtko Ursulin } 620b46a33e2STvrtko Ursulin 621b46a33e2STvrtko Ursulin static void i915_pmu_event_del(struct perf_event *event, int flags) 622b46a33e2STvrtko Ursulin { 623b46a33e2STvrtko Ursulin i915_pmu_event_stop(event, PERF_EF_UPDATE); 624b46a33e2STvrtko Ursulin } 625b46a33e2STvrtko Ursulin 626b46a33e2STvrtko Ursulin static int i915_pmu_event_event_idx(struct perf_event *event) 627b46a33e2STvrtko Ursulin { 628b46a33e2STvrtko Ursulin return 0; 629b46a33e2STvrtko Ursulin } 630b46a33e2STvrtko Ursulin 631b7d3aabfSChris Wilson struct i915_str_attribute { 632b7d3aabfSChris Wilson struct device_attribute attr; 633b7d3aabfSChris Wilson const char *str; 634b7d3aabfSChris Wilson }; 635b7d3aabfSChris Wilson 636b46a33e2STvrtko Ursulin static ssize_t i915_pmu_format_show(struct device *dev, 637b46a33e2STvrtko Ursulin struct device_attribute *attr, char *buf) 638b46a33e2STvrtko Ursulin { 639b7d3aabfSChris Wilson struct i915_str_attribute *eattr; 640b46a33e2STvrtko Ursulin 641b7d3aabfSChris Wilson eattr = container_of(attr, struct i915_str_attribute, attr); 642b7d3aabfSChris Wilson return sprintf(buf, "%s\n", eattr->str); 643b46a33e2STvrtko Ursulin } 644b46a33e2STvrtko Ursulin 645b46a33e2STvrtko Ursulin #define I915_PMU_FORMAT_ATTR(_name, _config) \ 646b7d3aabfSChris Wilson (&((struct i915_str_attribute[]) { \ 647b46a33e2STvrtko Ursulin { .attr = __ATTR(_name, 0444, i915_pmu_format_show, NULL), \ 648b7d3aabfSChris Wilson .str = _config, } \ 649b46a33e2STvrtko Ursulin })[0].attr.attr) 650b46a33e2STvrtko Ursulin 651b46a33e2STvrtko Ursulin static struct attribute *i915_pmu_format_attrs[] = { 652b46a33e2STvrtko Ursulin I915_PMU_FORMAT_ATTR(i915_eventid, "config:0-20"), 653b46a33e2STvrtko Ursulin NULL, 654b46a33e2STvrtko Ursulin }; 655b46a33e2STvrtko Ursulin 656b46a33e2STvrtko Ursulin static const struct attribute_group i915_pmu_format_attr_group = { 657b46a33e2STvrtko Ursulin .name = "format", 658b46a33e2STvrtko Ursulin .attrs = i915_pmu_format_attrs, 659b46a33e2STvrtko Ursulin }; 660b46a33e2STvrtko Ursulin 661b7d3aabfSChris Wilson struct i915_ext_attribute { 662b7d3aabfSChris Wilson struct device_attribute attr; 663b7d3aabfSChris Wilson unsigned long val; 664b7d3aabfSChris Wilson }; 665b7d3aabfSChris Wilson 666b46a33e2STvrtko Ursulin static ssize_t i915_pmu_event_show(struct device *dev, 667b46a33e2STvrtko Ursulin struct device_attribute *attr, char *buf) 668b46a33e2STvrtko Ursulin { 669b7d3aabfSChris Wilson struct i915_ext_attribute *eattr; 670b46a33e2STvrtko Ursulin 671b7d3aabfSChris Wilson eattr = container_of(attr, struct i915_ext_attribute, attr); 672b7d3aabfSChris Wilson return sprintf(buf, "config=0x%lx\n", eattr->val); 673b46a33e2STvrtko Ursulin } 674b46a33e2STvrtko Ursulin 675109ec558STvrtko Ursulin static struct attribute_group i915_pmu_events_attr_group = { 676b46a33e2STvrtko Ursulin .name = "events", 677109ec558STvrtko Ursulin /* Patch in attrs at runtime. */ 678b46a33e2STvrtko Ursulin }; 679b46a33e2STvrtko Ursulin 680b46a33e2STvrtko Ursulin static ssize_t 681b46a33e2STvrtko Ursulin i915_pmu_get_attr_cpumask(struct device *dev, 682b46a33e2STvrtko Ursulin struct device_attribute *attr, 683b46a33e2STvrtko Ursulin char *buf) 684b46a33e2STvrtko Ursulin { 685b46a33e2STvrtko Ursulin return cpumap_print_to_pagebuf(true, buf, &i915_pmu_cpumask); 686b46a33e2STvrtko Ursulin } 687b46a33e2STvrtko Ursulin 688b46a33e2STvrtko Ursulin static DEVICE_ATTR(cpumask, 0444, i915_pmu_get_attr_cpumask, NULL); 689b46a33e2STvrtko Ursulin 690b46a33e2STvrtko Ursulin static struct attribute *i915_cpumask_attrs[] = { 691b46a33e2STvrtko Ursulin &dev_attr_cpumask.attr, 692b46a33e2STvrtko Ursulin NULL, 693b46a33e2STvrtko Ursulin }; 694b46a33e2STvrtko Ursulin 695109ec558STvrtko Ursulin static const struct attribute_group i915_pmu_cpumask_attr_group = { 696b46a33e2STvrtko Ursulin .attrs = i915_cpumask_attrs, 697b46a33e2STvrtko Ursulin }; 698b46a33e2STvrtko Ursulin 699b46a33e2STvrtko Ursulin static const struct attribute_group *i915_pmu_attr_groups[] = { 700b46a33e2STvrtko Ursulin &i915_pmu_format_attr_group, 701b46a33e2STvrtko Ursulin &i915_pmu_events_attr_group, 702b46a33e2STvrtko Ursulin &i915_pmu_cpumask_attr_group, 703b46a33e2STvrtko Ursulin NULL 704b46a33e2STvrtko Ursulin }; 705b46a33e2STvrtko Ursulin 706109ec558STvrtko Ursulin #define __event(__config, __name, __unit) \ 707109ec558STvrtko Ursulin { \ 708109ec558STvrtko Ursulin .config = (__config), \ 709109ec558STvrtko Ursulin .name = (__name), \ 710109ec558STvrtko Ursulin .unit = (__unit), \ 711109ec558STvrtko Ursulin } 712109ec558STvrtko Ursulin 713109ec558STvrtko Ursulin #define __engine_event(__sample, __name) \ 714109ec558STvrtko Ursulin { \ 715109ec558STvrtko Ursulin .sample = (__sample), \ 716109ec558STvrtko Ursulin .name = (__name), \ 717109ec558STvrtko Ursulin } 718109ec558STvrtko Ursulin 719109ec558STvrtko Ursulin static struct i915_ext_attribute * 720109ec558STvrtko Ursulin add_i915_attr(struct i915_ext_attribute *attr, const char *name, u64 config) 721109ec558STvrtko Ursulin { 7222bbba4e9SChris Wilson sysfs_attr_init(&attr->attr.attr); 723109ec558STvrtko Ursulin attr->attr.attr.name = name; 724109ec558STvrtko Ursulin attr->attr.attr.mode = 0444; 725109ec558STvrtko Ursulin attr->attr.show = i915_pmu_event_show; 726109ec558STvrtko Ursulin attr->val = config; 727109ec558STvrtko Ursulin 728109ec558STvrtko Ursulin return ++attr; 729109ec558STvrtko Ursulin } 730109ec558STvrtko Ursulin 731109ec558STvrtko Ursulin static struct perf_pmu_events_attr * 732109ec558STvrtko Ursulin add_pmu_attr(struct perf_pmu_events_attr *attr, const char *name, 733109ec558STvrtko Ursulin const char *str) 734109ec558STvrtko Ursulin { 7352bbba4e9SChris Wilson sysfs_attr_init(&attr->attr.attr); 736109ec558STvrtko Ursulin attr->attr.attr.name = name; 737109ec558STvrtko Ursulin attr->attr.attr.mode = 0444; 738109ec558STvrtko Ursulin attr->attr.show = perf_event_sysfs_show; 739109ec558STvrtko Ursulin attr->event_str = str; 740109ec558STvrtko Ursulin 741109ec558STvrtko Ursulin return ++attr; 742109ec558STvrtko Ursulin } 743109ec558STvrtko Ursulin 744109ec558STvrtko Ursulin static struct attribute ** 745109ec558STvrtko Ursulin create_event_attributes(struct drm_i915_private *i915) 746109ec558STvrtko Ursulin { 747109ec558STvrtko Ursulin static const struct { 748109ec558STvrtko Ursulin u64 config; 749109ec558STvrtko Ursulin const char *name; 750109ec558STvrtko Ursulin const char *unit; 751109ec558STvrtko Ursulin } events[] = { 752109ec558STvrtko Ursulin __event(I915_PMU_ACTUAL_FREQUENCY, "actual-frequency", "MHz"), 753109ec558STvrtko Ursulin __event(I915_PMU_REQUESTED_FREQUENCY, "requested-frequency", "MHz"), 754109ec558STvrtko Ursulin __event(I915_PMU_INTERRUPTS, "interrupts", NULL), 755109ec558STvrtko Ursulin __event(I915_PMU_RC6_RESIDENCY, "rc6-residency", "ns"), 756109ec558STvrtko Ursulin }; 757109ec558STvrtko Ursulin static const struct { 758109ec558STvrtko Ursulin enum drm_i915_pmu_engine_sample sample; 759109ec558STvrtko Ursulin char *name; 760109ec558STvrtko Ursulin } engine_events[] = { 761109ec558STvrtko Ursulin __engine_event(I915_SAMPLE_BUSY, "busy"), 762109ec558STvrtko Ursulin __engine_event(I915_SAMPLE_SEMA, "sema"), 763109ec558STvrtko Ursulin __engine_event(I915_SAMPLE_WAIT, "wait"), 764109ec558STvrtko Ursulin }; 765109ec558STvrtko Ursulin unsigned int count = 0; 766109ec558STvrtko Ursulin struct perf_pmu_events_attr *pmu_attr = NULL, *pmu_iter; 767109ec558STvrtko Ursulin struct i915_ext_attribute *i915_attr = NULL, *i915_iter; 768109ec558STvrtko Ursulin struct attribute **attr = NULL, **attr_iter; 769109ec558STvrtko Ursulin struct intel_engine_cs *engine; 770109ec558STvrtko Ursulin enum intel_engine_id id; 771109ec558STvrtko Ursulin unsigned int i; 772109ec558STvrtko Ursulin 773109ec558STvrtko Ursulin /* Count how many counters we will be exposing. */ 774109ec558STvrtko Ursulin for (i = 0; i < ARRAY_SIZE(events); i++) { 775109ec558STvrtko Ursulin if (!config_status(i915, events[i].config)) 776109ec558STvrtko Ursulin count++; 777109ec558STvrtko Ursulin } 778109ec558STvrtko Ursulin 779109ec558STvrtko Ursulin for_each_engine(engine, i915, id) { 780109ec558STvrtko Ursulin for (i = 0; i < ARRAY_SIZE(engine_events); i++) { 781109ec558STvrtko Ursulin if (!engine_event_status(engine, 782109ec558STvrtko Ursulin engine_events[i].sample)) 783109ec558STvrtko Ursulin count++; 784109ec558STvrtko Ursulin } 785109ec558STvrtko Ursulin } 786109ec558STvrtko Ursulin 787109ec558STvrtko Ursulin /* Allocate attribute objects and table. */ 788*dd5fec87STvrtko Ursulin i915_attr = kcalloc(count, sizeof(*i915_attr), GFP_KERNEL); 789109ec558STvrtko Ursulin if (!i915_attr) 790109ec558STvrtko Ursulin goto err_alloc; 791109ec558STvrtko Ursulin 792*dd5fec87STvrtko Ursulin pmu_attr = kcalloc(count, sizeof(*pmu_attr), GFP_KERNEL); 793109ec558STvrtko Ursulin if (!pmu_attr) 794109ec558STvrtko Ursulin goto err_alloc; 795109ec558STvrtko Ursulin 796109ec558STvrtko Ursulin /* Max one pointer of each attribute type plus a termination entry. */ 797*dd5fec87STvrtko Ursulin attr = kcalloc(count * 2 + 1, sizeof(*attr), GFP_KERNEL); 798109ec558STvrtko Ursulin if (!attr) 799109ec558STvrtko Ursulin goto err_alloc; 800109ec558STvrtko Ursulin 801109ec558STvrtko Ursulin i915_iter = i915_attr; 802109ec558STvrtko Ursulin pmu_iter = pmu_attr; 803109ec558STvrtko Ursulin attr_iter = attr; 804109ec558STvrtko Ursulin 805109ec558STvrtko Ursulin /* Initialize supported non-engine counters. */ 806109ec558STvrtko Ursulin for (i = 0; i < ARRAY_SIZE(events); i++) { 807109ec558STvrtko Ursulin char *str; 808109ec558STvrtko Ursulin 809109ec558STvrtko Ursulin if (config_status(i915, events[i].config)) 810109ec558STvrtko Ursulin continue; 811109ec558STvrtko Ursulin 812109ec558STvrtko Ursulin str = kstrdup(events[i].name, GFP_KERNEL); 813109ec558STvrtko Ursulin if (!str) 814109ec558STvrtko Ursulin goto err; 815109ec558STvrtko Ursulin 816109ec558STvrtko Ursulin *attr_iter++ = &i915_iter->attr.attr; 817109ec558STvrtko Ursulin i915_iter = add_i915_attr(i915_iter, str, events[i].config); 818109ec558STvrtko Ursulin 819109ec558STvrtko Ursulin if (events[i].unit) { 820109ec558STvrtko Ursulin str = kasprintf(GFP_KERNEL, "%s.unit", events[i].name); 821109ec558STvrtko Ursulin if (!str) 822109ec558STvrtko Ursulin goto err; 823109ec558STvrtko Ursulin 824109ec558STvrtko Ursulin *attr_iter++ = &pmu_iter->attr.attr; 825109ec558STvrtko Ursulin pmu_iter = add_pmu_attr(pmu_iter, str, events[i].unit); 826109ec558STvrtko Ursulin } 827109ec558STvrtko Ursulin } 828109ec558STvrtko Ursulin 829109ec558STvrtko Ursulin /* Initialize supported engine counters. */ 830109ec558STvrtko Ursulin for_each_engine(engine, i915, id) { 831109ec558STvrtko Ursulin for (i = 0; i < ARRAY_SIZE(engine_events); i++) { 832109ec558STvrtko Ursulin char *str; 833109ec558STvrtko Ursulin 834109ec558STvrtko Ursulin if (engine_event_status(engine, 835109ec558STvrtko Ursulin engine_events[i].sample)) 836109ec558STvrtko Ursulin continue; 837109ec558STvrtko Ursulin 838109ec558STvrtko Ursulin str = kasprintf(GFP_KERNEL, "%s-%s", 839109ec558STvrtko Ursulin engine->name, engine_events[i].name); 840109ec558STvrtko Ursulin if (!str) 841109ec558STvrtko Ursulin goto err; 842109ec558STvrtko Ursulin 843109ec558STvrtko Ursulin *attr_iter++ = &i915_iter->attr.attr; 844109ec558STvrtko Ursulin i915_iter = 845109ec558STvrtko Ursulin add_i915_attr(i915_iter, str, 846109ec558STvrtko Ursulin __I915_PMU_ENGINE(engine->class, 847109ec558STvrtko Ursulin engine->instance, 848109ec558STvrtko Ursulin engine_events[i].sample)); 849109ec558STvrtko Ursulin 850109ec558STvrtko Ursulin str = kasprintf(GFP_KERNEL, "%s-%s.unit", 851109ec558STvrtko Ursulin engine->name, engine_events[i].name); 852109ec558STvrtko Ursulin if (!str) 853109ec558STvrtko Ursulin goto err; 854109ec558STvrtko Ursulin 855109ec558STvrtko Ursulin *attr_iter++ = &pmu_iter->attr.attr; 856109ec558STvrtko Ursulin pmu_iter = add_pmu_attr(pmu_iter, str, "ns"); 857109ec558STvrtko Ursulin } 858109ec558STvrtko Ursulin } 859109ec558STvrtko Ursulin 860109ec558STvrtko Ursulin i915->pmu.i915_attr = i915_attr; 861109ec558STvrtko Ursulin i915->pmu.pmu_attr = pmu_attr; 862109ec558STvrtko Ursulin 863109ec558STvrtko Ursulin return attr; 864109ec558STvrtko Ursulin 865109ec558STvrtko Ursulin err:; 866109ec558STvrtko Ursulin for (attr_iter = attr; *attr_iter; attr_iter++) 867109ec558STvrtko Ursulin kfree((*attr_iter)->name); 868109ec558STvrtko Ursulin 869109ec558STvrtko Ursulin err_alloc: 870109ec558STvrtko Ursulin kfree(attr); 871109ec558STvrtko Ursulin kfree(i915_attr); 872109ec558STvrtko Ursulin kfree(pmu_attr); 873109ec558STvrtko Ursulin 874109ec558STvrtko Ursulin return NULL; 875109ec558STvrtko Ursulin } 876109ec558STvrtko Ursulin 877109ec558STvrtko Ursulin static void free_event_attributes(struct drm_i915_private *i915) 878109ec558STvrtko Ursulin { 879109ec558STvrtko Ursulin struct attribute **attr_iter = i915_pmu_events_attr_group.attrs; 880109ec558STvrtko Ursulin 881109ec558STvrtko Ursulin for (; *attr_iter; attr_iter++) 882109ec558STvrtko Ursulin kfree((*attr_iter)->name); 883109ec558STvrtko Ursulin 884109ec558STvrtko Ursulin kfree(i915_pmu_events_attr_group.attrs); 885109ec558STvrtko Ursulin kfree(i915->pmu.i915_attr); 886109ec558STvrtko Ursulin kfree(i915->pmu.pmu_attr); 887109ec558STvrtko Ursulin 888109ec558STvrtko Ursulin i915_pmu_events_attr_group.attrs = NULL; 889109ec558STvrtko Ursulin i915->pmu.i915_attr = NULL; 890109ec558STvrtko Ursulin i915->pmu.pmu_attr = NULL; 891109ec558STvrtko Ursulin } 892109ec558STvrtko Ursulin 893b46a33e2STvrtko Ursulin static int i915_pmu_cpu_online(unsigned int cpu, struct hlist_node *node) 894b46a33e2STvrtko Ursulin { 895b46a33e2STvrtko Ursulin struct i915_pmu *pmu = hlist_entry_safe(node, typeof(*pmu), node); 896b46a33e2STvrtko Ursulin 897b46a33e2STvrtko Ursulin GEM_BUG_ON(!pmu->base.event_init); 898b46a33e2STvrtko Ursulin 899b46a33e2STvrtko Ursulin /* Select the first online CPU as a designated reader. */ 9000426c046STvrtko Ursulin if (!cpumask_weight(&i915_pmu_cpumask)) 901b46a33e2STvrtko Ursulin cpumask_set_cpu(cpu, &i915_pmu_cpumask); 902b46a33e2STvrtko Ursulin 903b46a33e2STvrtko Ursulin return 0; 904b46a33e2STvrtko Ursulin } 905b46a33e2STvrtko Ursulin 906b46a33e2STvrtko Ursulin static int i915_pmu_cpu_offline(unsigned int cpu, struct hlist_node *node) 907b46a33e2STvrtko Ursulin { 908b46a33e2STvrtko Ursulin struct i915_pmu *pmu = hlist_entry_safe(node, typeof(*pmu), node); 909b46a33e2STvrtko Ursulin unsigned int target; 910b46a33e2STvrtko Ursulin 911b46a33e2STvrtko Ursulin GEM_BUG_ON(!pmu->base.event_init); 912b46a33e2STvrtko Ursulin 913b46a33e2STvrtko Ursulin if (cpumask_test_and_clear_cpu(cpu, &i915_pmu_cpumask)) { 914b46a33e2STvrtko Ursulin target = cpumask_any_but(topology_sibling_cpumask(cpu), cpu); 915b46a33e2STvrtko Ursulin /* Migrate events if there is a valid target */ 916b46a33e2STvrtko Ursulin if (target < nr_cpu_ids) { 917b46a33e2STvrtko Ursulin cpumask_set_cpu(target, &i915_pmu_cpumask); 918b46a33e2STvrtko Ursulin perf_pmu_migrate_context(&pmu->base, cpu, target); 919b46a33e2STvrtko Ursulin } 920b46a33e2STvrtko Ursulin } 921b46a33e2STvrtko Ursulin 922b46a33e2STvrtko Ursulin return 0; 923b46a33e2STvrtko Ursulin } 924b46a33e2STvrtko Ursulin 925b46a33e2STvrtko Ursulin static enum cpuhp_state cpuhp_slot = CPUHP_INVALID; 926b46a33e2STvrtko Ursulin 927b46a33e2STvrtko Ursulin static int i915_pmu_register_cpuhp_state(struct drm_i915_private *i915) 928b46a33e2STvrtko Ursulin { 929b46a33e2STvrtko Ursulin enum cpuhp_state slot; 930b46a33e2STvrtko Ursulin int ret; 931b46a33e2STvrtko Ursulin 932b46a33e2STvrtko Ursulin ret = cpuhp_setup_state_multi(CPUHP_AP_ONLINE_DYN, 933b46a33e2STvrtko Ursulin "perf/x86/intel/i915:online", 934b46a33e2STvrtko Ursulin i915_pmu_cpu_online, 935b46a33e2STvrtko Ursulin i915_pmu_cpu_offline); 936b46a33e2STvrtko Ursulin if (ret < 0) 937b46a33e2STvrtko Ursulin return ret; 938b46a33e2STvrtko Ursulin 939b46a33e2STvrtko Ursulin slot = ret; 940b46a33e2STvrtko Ursulin ret = cpuhp_state_add_instance(slot, &i915->pmu.node); 941b46a33e2STvrtko Ursulin if (ret) { 942b46a33e2STvrtko Ursulin cpuhp_remove_multi_state(slot); 943b46a33e2STvrtko Ursulin return ret; 944b46a33e2STvrtko Ursulin } 945b46a33e2STvrtko Ursulin 946b46a33e2STvrtko Ursulin cpuhp_slot = slot; 947b46a33e2STvrtko Ursulin return 0; 948b46a33e2STvrtko Ursulin } 949b46a33e2STvrtko Ursulin 950b46a33e2STvrtko Ursulin static void i915_pmu_unregister_cpuhp_state(struct drm_i915_private *i915) 951b46a33e2STvrtko Ursulin { 952b46a33e2STvrtko Ursulin WARN_ON(cpuhp_slot == CPUHP_INVALID); 953b46a33e2STvrtko Ursulin WARN_ON(cpuhp_state_remove_instance(cpuhp_slot, &i915->pmu.node)); 954b46a33e2STvrtko Ursulin cpuhp_remove_multi_state(cpuhp_slot); 955b46a33e2STvrtko Ursulin } 956b46a33e2STvrtko Ursulin 957b46a33e2STvrtko Ursulin void i915_pmu_register(struct drm_i915_private *i915) 958b46a33e2STvrtko Ursulin { 959b3add01eSTvrtko Ursulin struct intel_engine_cs *engine; 960b3add01eSTvrtko Ursulin enum intel_engine_id id; 961b46a33e2STvrtko Ursulin int ret; 962b46a33e2STvrtko Ursulin 963b46a33e2STvrtko Ursulin if (INTEL_GEN(i915) <= 2) { 964b46a33e2STvrtko Ursulin DRM_INFO("PMU not supported for this GPU."); 965b46a33e2STvrtko Ursulin return; 966b46a33e2STvrtko Ursulin } 967b46a33e2STvrtko Ursulin 968109ec558STvrtko Ursulin i915_pmu_events_attr_group.attrs = create_event_attributes(i915); 969109ec558STvrtko Ursulin if (!i915_pmu_events_attr_group.attrs) { 970109ec558STvrtko Ursulin ret = -ENOMEM; 971109ec558STvrtko Ursulin goto err; 972109ec558STvrtko Ursulin } 973109ec558STvrtko Ursulin 974b46a33e2STvrtko Ursulin i915->pmu.base.attr_groups = i915_pmu_attr_groups; 975b46a33e2STvrtko Ursulin i915->pmu.base.task_ctx_nr = perf_invalid_context; 976b46a33e2STvrtko Ursulin i915->pmu.base.event_init = i915_pmu_event_init; 977b46a33e2STvrtko Ursulin i915->pmu.base.add = i915_pmu_event_add; 978b46a33e2STvrtko Ursulin i915->pmu.base.del = i915_pmu_event_del; 979b46a33e2STvrtko Ursulin i915->pmu.base.start = i915_pmu_event_start; 980b46a33e2STvrtko Ursulin i915->pmu.base.stop = i915_pmu_event_stop; 981b46a33e2STvrtko Ursulin i915->pmu.base.read = i915_pmu_event_read; 982b46a33e2STvrtko Ursulin i915->pmu.base.event_idx = i915_pmu_event_event_idx; 983b46a33e2STvrtko Ursulin 984b46a33e2STvrtko Ursulin spin_lock_init(&i915->pmu.lock); 985b46a33e2STvrtko Ursulin hrtimer_init(&i915->pmu.timer, CLOCK_MONOTONIC, HRTIMER_MODE_REL); 986b46a33e2STvrtko Ursulin i915->pmu.timer.function = i915_sample; 987b46a33e2STvrtko Ursulin 988b3add01eSTvrtko Ursulin for_each_engine(engine, i915, id) 989b3add01eSTvrtko Ursulin INIT_DELAYED_WORK(&engine->pmu.disable_busy_stats, 990b3add01eSTvrtko Ursulin __disable_busy_stats); 991b3add01eSTvrtko Ursulin 992b46a33e2STvrtko Ursulin ret = perf_pmu_register(&i915->pmu.base, "i915", -1); 993b46a33e2STvrtko Ursulin if (ret) 994b46a33e2STvrtko Ursulin goto err; 995b46a33e2STvrtko Ursulin 996b46a33e2STvrtko Ursulin ret = i915_pmu_register_cpuhp_state(i915); 997b46a33e2STvrtko Ursulin if (ret) 998b46a33e2STvrtko Ursulin goto err_unreg; 999b46a33e2STvrtko Ursulin 1000b46a33e2STvrtko Ursulin return; 1001b46a33e2STvrtko Ursulin 1002b46a33e2STvrtko Ursulin err_unreg: 1003b46a33e2STvrtko Ursulin perf_pmu_unregister(&i915->pmu.base); 1004b46a33e2STvrtko Ursulin err: 1005b46a33e2STvrtko Ursulin i915->pmu.base.event_init = NULL; 1006109ec558STvrtko Ursulin free_event_attributes(i915); 1007b46a33e2STvrtko Ursulin DRM_NOTE("Failed to register PMU! (err=%d)\n", ret); 1008b46a33e2STvrtko Ursulin } 1009b46a33e2STvrtko Ursulin 1010b46a33e2STvrtko Ursulin void i915_pmu_unregister(struct drm_i915_private *i915) 1011b46a33e2STvrtko Ursulin { 1012b3add01eSTvrtko Ursulin struct intel_engine_cs *engine; 1013b3add01eSTvrtko Ursulin enum intel_engine_id id; 1014b3add01eSTvrtko Ursulin 1015b46a33e2STvrtko Ursulin if (!i915->pmu.base.event_init) 1016b46a33e2STvrtko Ursulin return; 1017b46a33e2STvrtko Ursulin 1018b46a33e2STvrtko Ursulin WARN_ON(i915->pmu.enable); 1019b46a33e2STvrtko Ursulin 1020b46a33e2STvrtko Ursulin hrtimer_cancel(&i915->pmu.timer); 1021b46a33e2STvrtko Ursulin 1022b3add01eSTvrtko Ursulin for_each_engine(engine, i915, id) { 1023b3add01eSTvrtko Ursulin GEM_BUG_ON(engine->pmu.busy_stats); 1024b3add01eSTvrtko Ursulin flush_delayed_work(&engine->pmu.disable_busy_stats); 1025b3add01eSTvrtko Ursulin } 1026b3add01eSTvrtko Ursulin 1027b46a33e2STvrtko Ursulin i915_pmu_unregister_cpuhp_state(i915); 1028b46a33e2STvrtko Ursulin 1029b46a33e2STvrtko Ursulin perf_pmu_unregister(&i915->pmu.base); 1030b46a33e2STvrtko Ursulin i915->pmu.base.event_init = NULL; 1031109ec558STvrtko Ursulin free_event_attributes(i915); 1032b46a33e2STvrtko Ursulin } 1033