/*
 * Performance counter x86 architecture code
 *
 * Copyright(C) 2008 Thomas Gleixner <tglx@linutronix.de>
 * Copyright(C) 2008 Red Hat, Inc., Ingo Molnar
 * Copyright(C) 2009 Jaswinder Singh Rajput
 * Copyright(C) 2009 Advanced Micro Devices, Inc., Robert Richter
 *
 * For licencing details see kernel-base/COPYING
 */

#include <linux/perf_counter.h>
#include <linux/capability.h>
#include <linux/notifier.h>
#include <linux/hardirq.h>
#include <linux/kprobes.h>
#include <linux/module.h>
#include <linux/kdebug.h>
#include <linux/sched.h>
#include <linux/uaccess.h>

#include <asm/apic.h>
#include <asm/stacktrace.h>
#include <asm/nmi.h>

static u64 perf_counter_mask __read_mostly;

struct cpu_hw_counters {
	struct perf_counter	*counters[X86_PMC_IDX_MAX];
	unsigned long		used[BITS_TO_LONGS(X86_PMC_IDX_MAX)];
	unsigned long		active[BITS_TO_LONGS(X86_PMC_IDX_MAX)];
	unsigned long		interrupts;
	u64			throttle_ctrl;
	int			enabled;
};

/*
 * struct x86_pmu - generic x86 pmu
 */
struct x86_pmu {
	const char	*name;
	int		version;
	int		(*handle_irq)(struct pt_regs *, int);
	u64		(*save_disable_all)(void);
	void		(*restore_all)(u64);
	void		(*enable)(struct hw_perf_counter *, int);
	void		(*disable)(struct hw_perf_counter *, int);
	unsigned	eventsel;
	unsigned	perfctr;
	u64		(*event_map)(int);
	u64		(*raw_event)(u64);
	int		max_events;
	int		num_counters;
	int		num_counters_fixed;
	int		counter_bits;
	u64		counter_mask;
};
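
/*
 * The vendor init code (intel_pmu_init()/amd_pmu_init() below) copies
 * one of the static instances, intel_pmu or amd_pmu, into the global
 * x86_pmu; all generic paths then dispatch through these function
 * pointers.
 */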

static struct x86_pmu x86_pmu __read_mostly;

static DEFINE_PER_CPU(struct cpu_hw_counters, cpu_hw_counters) = {
	.enabled = 1,
};

/*
 * Intel PerfMon v3. Used on Core2 and later.
 */
static const u64 intel_perfmon_event_map[] =
{
	[PERF_COUNT_CPU_CYCLES]			= 0x003c,
	[PERF_COUNT_INSTRUCTIONS]		= 0x00c0,
	[PERF_COUNT_CACHE_REFERENCES]		= 0x4f2e,
	[PERF_COUNT_CACHE_MISSES]		= 0x412e,
	[PERF_COUNT_BRANCH_INSTRUCTIONS]	= 0x00c4,
	[PERF_COUNT_BRANCH_MISSES]		= 0x00c5,
	[PERF_COUNT_BUS_CYCLES]			= 0x013c,
};

static u64 intel_pmu_event_map(int event)
{
	return intel_perfmon_event_map[event];
}

static u64 intel_pmu_raw_event(u64 event)
{
#define CORE_EVNTSEL_EVENT_MASK		0x000000FFULL
#define CORE_EVNTSEL_UNIT_MASK		0x0000FF00ULL
#define CORE_EVNTSEL_COUNTER_MASK	0xFF000000ULL

#define CORE_EVNTSEL_MASK		\
	(CORE_EVNTSEL_EVENT_MASK |	\
	 CORE_EVNTSEL_UNIT_MASK  |	\
	 CORE_EVNTSEL_COUNTER_MASK)

	return event & CORE_EVNTSEL_MASK;
}
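
/*
 * Illustrative example: the mask above strips the USR/OS/INT/ENABLE
 * control bits, so a raw config of 0x404f2e (event 0x2e, umask 0x4f,
 * plus the ENABLE bit) comes back as 0x4f2e; the kernel re-applies the
 * control bits itself in __hw_perf_counter_init().
 */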

/*
 * AMD Performance Monitor K7 and later.
 */
static const u64 amd_perfmon_event_map[] =
{
	[PERF_COUNT_CPU_CYCLES]			= 0x0076,
	[PERF_COUNT_INSTRUCTIONS]		= 0x00c0,
	[PERF_COUNT_CACHE_REFERENCES]		= 0x0080,
	[PERF_COUNT_CACHE_MISSES]		= 0x0081,
	[PERF_COUNT_BRANCH_INSTRUCTIONS]	= 0x00c4,
	[PERF_COUNT_BRANCH_MISSES]		= 0x00c5,
};

static u64 amd_pmu_event_map(int event)
{
	return amd_perfmon_event_map[event];
}

static u64 amd_pmu_raw_event(u64 event)
{
#define K7_EVNTSEL_EVENT_MASK	0x7000000FFULL
#define K7_EVNTSEL_UNIT_MASK	0x00000FF00ULL
#define K7_EVNTSEL_COUNTER_MASK	0x0FF000000ULL

#define K7_EVNTSEL_MASK			\
	(K7_EVNTSEL_EVENT_MASK |	\
	 K7_EVNTSEL_UNIT_MASK  |	\
	 K7_EVNTSEL_COUNTER_MASK)

	return event & K7_EVNTSEL_MASK;
}

/*
 * Propagate counter elapsed time into the generic counter.
 * Can only be executed on the CPU where the counter is active.
 * Returns the delta events processed.
 */
static void
x86_perf_counter_update(struct perf_counter *counter,
			struct hw_perf_counter *hwc, int idx)
{
	u64 prev_raw_count, new_raw_count, delta;

	/*
	 * Careful: an NMI might modify the previous counter value.
	 *
	 * Our tactic to handle this is to first atomically read and
	 * exchange a new raw count - then add that new-prev delta
	 * count to the generic counter atomically:
	 */
again:
	prev_raw_count = atomic64_read(&hwc->prev_count);
	rdmsrl(hwc->counter_base + idx, new_raw_count);

	if (atomic64_cmpxchg(&hwc->prev_count, prev_raw_count,
					new_raw_count) != prev_raw_count)
		goto again;

	/*
	 * Now we have the new raw value and have updated the prev
	 * timestamp already. We can now calculate the elapsed delta
	 * (counter-)time and add that to the generic counter.
	 *
	 * Careful, not all hw sign-extends above the physical width
	 * of the count, so we do that by clipping the delta to 32 bits:
	 */
	delta = (u64)(u32)((s32)new_raw_count - (s32)prev_raw_count);

	atomic64_add(delta, &counter->count);
	atomic64_sub(delta, &hwc->period_left);
}
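
/*
 * Worked example of the 32-bit clipping above: if the low 32 bits of
 * prev_raw_count read 0xfffffff0 and new_raw_count reads 0x00000010,
 * the signed 32-bit subtraction yields 0x20, i.e. 32 elapsed events,
 * regardless of how the hardware extends bits above bit 31.
 */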

static atomic_t num_counters;
static DEFINE_MUTEX(pmc_reserve_mutex);

static bool reserve_pmc_hardware(void)
{
	int i;

	if (nmi_watchdog == NMI_LOCAL_APIC)
		disable_lapic_nmi_watchdog();

	for (i = 0; i < x86_pmu.num_counters; i++) {
		if (!reserve_perfctr_nmi(x86_pmu.perfctr + i))
			goto perfctr_fail;
	}

	for (i = 0; i < x86_pmu.num_counters; i++) {
		if (!reserve_evntsel_nmi(x86_pmu.eventsel + i))
			goto eventsel_fail;
	}

	return true;

eventsel_fail:
	for (i--; i >= 0; i--)
		release_evntsel_nmi(x86_pmu.eventsel + i);

	i = x86_pmu.num_counters;

perfctr_fail:
	for (i--; i >= 0; i--)
		release_perfctr_nmi(x86_pmu.perfctr + i);

	if (nmi_watchdog == NMI_LOCAL_APIC)
		enable_lapic_nmi_watchdog();

	return false;
}

static void release_pmc_hardware(void)
{
	int i;

	for (i = 0; i < x86_pmu.num_counters; i++) {
		release_perfctr_nmi(x86_pmu.perfctr + i);
		release_evntsel_nmi(x86_pmu.eventsel + i);
	}

	if (nmi_watchdog == NMI_LOCAL_APIC)
		enable_lapic_nmi_watchdog();
}

static void hw_perf_counter_destroy(struct perf_counter *counter)
{
	if (atomic_dec_and_mutex_lock(&num_counters, &pmc_reserve_mutex)) {
		release_pmc_hardware();
		mutex_unlock(&pmc_reserve_mutex);
	}
}

static inline int x86_pmu_initialized(void)
{
	return x86_pmu.handle_irq != NULL;
}

/*
 * Set up the hardware configuration for a given hw_event_type
 */
static int __hw_perf_counter_init(struct perf_counter *counter)
{
	struct perf_counter_hw_event *hw_event = &counter->hw_event;
	struct hw_perf_counter *hwc = &counter->hw;
	int err;

	/* disable temporarily */
	if (boot_cpu_data.x86_vendor == X86_VENDOR_AMD)
		return -ENOSYS;

	if (!x86_pmu_initialized())
		return -ENODEV;

	err = 0;
	if (!atomic_inc_not_zero(&num_counters)) {
		mutex_lock(&pmc_reserve_mutex);
		if (atomic_read(&num_counters) == 0 && !reserve_pmc_hardware())
			err = -EBUSY;
		else
			atomic_inc(&num_counters);
		mutex_unlock(&pmc_reserve_mutex);
	}
	if (err)
		return err;

	/*
	 * Generate PMC IRQs:
	 * (keep 'enabled' bit clear for now)
	 */
	hwc->config = ARCH_PERFMON_EVENTSEL_INT;

	/*
	 * Count user and OS events unless requested not to.
	 */
	if (!hw_event->exclude_user)
		hwc->config |= ARCH_PERFMON_EVENTSEL_USR;
	if (!hw_event->exclude_kernel)
		hwc->config |= ARCH_PERFMON_EVENTSEL_OS;

	/*
	 * If privileged enough, allow NMI events:
	 */
	hwc->nmi = 0;
	if (capable(CAP_SYS_ADMIN) && hw_event->nmi)
		hwc->nmi = 1;

	hwc->irq_period = hw_event->irq_period;
	/*
	 * Intel PMCs cannot be accessed sanely above 32-bit width,
	 * so we install an artificial 1<<31 period regardless of
	 * the generic counter period:
	 */
	if (boot_cpu_data.x86_vendor == X86_VENDOR_INTEL)
		if ((s64)hwc->irq_period <= 0 || hwc->irq_period > 0x7FFFFFFF)
			hwc->irq_period = 0x7FFFFFFF;

	atomic64_set(&hwc->period_left, hwc->irq_period);

	/*
	 * Raw event types provide the config in the event structure
	 */
	if (perf_event_raw(hw_event)) {
		hwc->config |= x86_pmu.raw_event(perf_event_config(hw_event));
	} else {
		if (perf_event_id(hw_event) >= x86_pmu.max_events)
			return -EINVAL;
		/*
		 * The generic map:
		 */
		hwc->config |= x86_pmu.event_map(perf_event_id(hw_event));
	}

	counter->destroy = hw_perf_counter_destroy;

	return 0;
}
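
/*
 * Illustrative example: a generic PERF_COUNT_INSTRUCTIONS counter with
 * exclude_kernel set ends up, on Intel, with hwc->config ==
 * ARCH_PERFMON_EVENTSEL_INT | ARCH_PERFMON_EVENTSEL_USR | 0x00c0; the
 * ENABLE bit is only set later, when the counter is scheduled onto a
 * PMC.
 */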

static u64 intel_pmu_save_disable_all(void)
{
	u64 ctrl;

	rdmsrl(MSR_CORE_PERF_GLOBAL_CTRL, ctrl);
	wrmsrl(MSR_CORE_PERF_GLOBAL_CTRL, 0);

	return ctrl;
}

static u64 amd_pmu_save_disable_all(void)
{
	struct cpu_hw_counters *cpuc = &__get_cpu_var(cpu_hw_counters);
	int enabled, idx;

	enabled = cpuc->enabled;
	cpuc->enabled = 0;
	/*
	 * ensure we write the disable before we start disabling the
	 * counters proper, so that amd_pmu_enable_counter() does the
	 * right thing.
	 */
	barrier();

	for (idx = 0; idx < x86_pmu.num_counters; idx++) {
		u64 val;

		if (!test_bit(idx, cpuc->active))
			continue;
		rdmsrl(MSR_K7_EVNTSEL0 + idx, val);
		if (!(val & ARCH_PERFMON_EVENTSEL0_ENABLE))
			continue;
		val &= ~ARCH_PERFMON_EVENTSEL0_ENABLE;
		wrmsrl(MSR_K7_EVNTSEL0 + idx, val);
	}

	return enabled;
}

u64 hw_perf_save_disable(void)
{
	if (!x86_pmu_initialized())
		return 0;
	return x86_pmu.save_disable_all();
}
/*
 * Exported because of ACPI idle
 */
EXPORT_SYMBOL_GPL(hw_perf_save_disable);

static void intel_pmu_restore_all(u64 ctrl)
{
	wrmsrl(MSR_CORE_PERF_GLOBAL_CTRL, ctrl);
}

static void amd_pmu_restore_all(u64 ctrl)
{
	struct cpu_hw_counters *cpuc = &__get_cpu_var(cpu_hw_counters);
	int idx;

	cpuc->enabled = ctrl;
	barrier();
	if (!ctrl)
		return;

	for (idx = 0; idx < x86_pmu.num_counters; idx++) {
		u64 val;

		if (!test_bit(idx, cpuc->active))
			continue;
		rdmsrl(MSR_K7_EVNTSEL0 + idx, val);
		if (val & ARCH_PERFMON_EVENTSEL0_ENABLE)
			continue;
		val |= ARCH_PERFMON_EVENTSEL0_ENABLE;
		wrmsrl(MSR_K7_EVNTSEL0 + idx, val);
	}
}

void hw_perf_restore(u64 ctrl)
{
	if (!x86_pmu_initialized())
		return;
	x86_pmu.restore_all(ctrl);
}
/*
 * Exported because of ACPI idle
 */
EXPORT_SYMBOL_GPL(hw_perf_restore);

static inline u64 intel_pmu_get_status(u64 mask)
{
	u64 status;

	rdmsrl(MSR_CORE_PERF_GLOBAL_STATUS, status);

	return status;
}

static inline void intel_pmu_ack_status(u64 ack)
{
	wrmsrl(MSR_CORE_PERF_GLOBAL_OVF_CTRL, ack);
}

static inline void x86_pmu_enable_counter(struct hw_perf_counter *hwc, int idx)
{
	int err;
	err = checking_wrmsrl(hwc->config_base + idx,
			      hwc->config | ARCH_PERFMON_EVENTSEL0_ENABLE);
}

static inline void x86_pmu_disable_counter(struct hw_perf_counter *hwc, int idx)
{
	int err;
	err = checking_wrmsrl(hwc->config_base + idx,
			      hwc->config);
}

static inline void
intel_pmu_disable_fixed(struct hw_perf_counter *hwc, int __idx)
{
	int idx = __idx - X86_PMC_IDX_FIXED;
	u64 ctrl_val, mask;
	int err;

	mask = 0xfULL << (idx * 4);

	rdmsrl(hwc->config_base, ctrl_val);
	ctrl_val &= ~mask;
	err = checking_wrmsrl(hwc->config_base, ctrl_val);
}

static inline void
intel_pmu_disable_counter(struct hw_perf_counter *hwc, int idx)
{
	if (unlikely(hwc->config_base == MSR_ARCH_PERFMON_FIXED_CTR_CTRL)) {
		intel_pmu_disable_fixed(hwc, idx);
		return;
	}

	x86_pmu_disable_counter(hwc, idx);
}

static inline void
amd_pmu_disable_counter(struct hw_perf_counter *hwc, int idx)
{
	x86_pmu_disable_counter(hwc, idx);
}

static DEFINE_PER_CPU(u64, prev_left[X86_PMC_IDX_MAX]);

/*
 * Set the next IRQ period, based on the hwc->period_left value.
 * To be called with the counter disabled in hw:
 */
static void
x86_perf_counter_set_period(struct perf_counter *counter,
			    struct hw_perf_counter *hwc, int idx)
{
	s64 left = atomic64_read(&hwc->period_left);
	s64 period = hwc->irq_period;
	int err;

	/*
	 * If we are way outside a reasonable range then just skip forward:
	 */
	if (unlikely(left <= -period)) {
		left = period;
		atomic64_set(&hwc->period_left, left);
	}

	if (unlikely(left <= 0)) {
		left += period;
		atomic64_set(&hwc->period_left, left);
	}

	per_cpu(prev_left[idx], smp_processor_id()) = left;

	/*
	 * The hw counter starts counting from this counter offset,
	 * mark it to be able to extract future deltas:
	 */
	atomic64_set(&hwc->prev_count, (u64)-left);

	err = checking_wrmsrl(hwc->counter_base + idx,
			      (u64)(-left) & x86_pmu.counter_mask);
}
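
/*
 * Illustrative example: with irq_period == 100000, the counter register
 * is programmed to (u64)-100000 masked to the counter width, so the PMC
 * overflows (and raises its interrupt) after exactly 100000 increments;
 * prev_count records the same offset for x86_perf_counter_update().
 */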

static inline void
intel_pmu_enable_fixed(struct hw_perf_counter *hwc, int __idx)
{
	int idx = __idx - X86_PMC_IDX_FIXED;
	u64 ctrl_val, bits, mask;
	int err;

	/*
	 * Enable IRQ generation (0x8),
	 * and enable ring-3 counting (0x2) and ring-0 counting (0x1)
	 * if requested:
	 */
	bits = 0x8ULL;
	if (hwc->config & ARCH_PERFMON_EVENTSEL_USR)
		bits |= 0x2;
	if (hwc->config & ARCH_PERFMON_EVENTSEL_OS)
		bits |= 0x1;
	bits <<= (idx * 4);
	mask = 0xfULL << (idx * 4);

	rdmsrl(hwc->config_base, ctrl_val);
	ctrl_val &= ~mask;
	ctrl_val |= bits;
	err = checking_wrmsrl(hwc->config_base, ctrl_val);
}
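
/*
 * Illustrative example: for fixed counter 1 with both USR and OS
 * counting requested, bits == 0xb and the code above rewrites only
 * nibble 1 of MSR_ARCH_PERFMON_FIXED_CTR_CTRL to 0xb, leaving the
 * nibbles of the other fixed counters untouched.
 */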

static void intel_pmu_enable_counter(struct hw_perf_counter *hwc, int idx)
{
	if (unlikely(hwc->config_base == MSR_ARCH_PERFMON_FIXED_CTR_CTRL)) {
		intel_pmu_enable_fixed(hwc, idx);
		return;
	}

	x86_pmu_enable_counter(hwc, idx);
}

static void amd_pmu_enable_counter(struct hw_perf_counter *hwc, int idx)
{
	struct cpu_hw_counters *cpuc = &__get_cpu_var(cpu_hw_counters);

	if (cpuc->enabled)
		x86_pmu_enable_counter(hwc, idx);
	else
		x86_pmu_disable_counter(hwc, idx);
}

static int
fixed_mode_idx(struct perf_counter *counter, struct hw_perf_counter *hwc)
{
	unsigned int event;

	if (boot_cpu_data.x86_vendor == X86_VENDOR_AMD)
		return -1;

	if (unlikely(hwc->nmi))
		return -1;

	event = hwc->config & ARCH_PERFMON_EVENT_MASK;

	if (unlikely(event == x86_pmu.event_map(PERF_COUNT_INSTRUCTIONS)))
		return X86_PMC_IDX_FIXED_INSTRUCTIONS;
	if (unlikely(event == x86_pmu.event_map(PERF_COUNT_CPU_CYCLES)))
		return X86_PMC_IDX_FIXED_CPU_CYCLES;
	if (unlikely(event == x86_pmu.event_map(PERF_COUNT_BUS_CYCLES)))
		return X86_PMC_IDX_FIXED_BUS_CYCLES;

	return -1;
}
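
/*
 * On Intel this maps the architectural events 0x00c0 (instructions),
 * 0x003c (cpu cycles) and 0x013c (bus cycles) onto the three
 * fixed-function counters, keeping the generic PMCs free; everything
 * else (and all AMD or NMI counters) falls back to the generic path
 * via -1.
 */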

/*
 * Find a PMC slot for the freshly enabled / scheduled in counter:
 */
static int x86_pmu_enable(struct perf_counter *counter)
{
	struct cpu_hw_counters *cpuc = &__get_cpu_var(cpu_hw_counters);
	struct hw_perf_counter *hwc = &counter->hw;
	int idx;

	idx = fixed_mode_idx(counter, hwc);
	if (idx >= 0) {
		/*
		 * Try to get the fixed counter, if that is already taken
		 * then try to get a generic counter:
		 */
		if (test_and_set_bit(idx, cpuc->used))
			goto try_generic;

		hwc->config_base = MSR_ARCH_PERFMON_FIXED_CTR_CTRL;
		/*
		 * We set it so that counter_base + idx in wrmsr/rdmsr maps to
		 * MSR_ARCH_PERFMON_FIXED_CTR0 ... CTR2:
		 */
		hwc->counter_base =
			MSR_ARCH_PERFMON_FIXED_CTR0 - X86_PMC_IDX_FIXED;
		hwc->idx = idx;
	} else {
		idx = hwc->idx;
		/* Try to get the previous generic counter again */
		if (test_and_set_bit(idx, cpuc->used)) {
try_generic:
			idx = find_first_zero_bit(cpuc->used,
						  x86_pmu.num_counters);
			if (idx == x86_pmu.num_counters)
				return -EAGAIN;

			set_bit(idx, cpuc->used);
			hwc->idx = idx;
		}
		hwc->config_base = x86_pmu.eventsel;
		hwc->counter_base = x86_pmu.perfctr;
	}

	perf_counters_lapic_init(hwc->nmi);

	x86_pmu.disable(hwc, idx);

	cpuc->counters[idx] = counter;
	set_bit(idx, cpuc->active);

	x86_perf_counter_set_period(counter, hwc, idx);
	x86_pmu.enable(hwc, idx);

	return 0;
}

void perf_counter_print_debug(void)
{
	u64 ctrl, status, overflow, pmc_ctrl, pmc_count, prev_left, fixed;
	struct cpu_hw_counters *cpuc;
	int cpu, idx;

	if (!x86_pmu.num_counters)
		return;

	local_irq_disable();

	cpu = smp_processor_id();
	cpuc = &per_cpu(cpu_hw_counters, cpu);

	if (x86_pmu.version >= 2) {
		rdmsrl(MSR_CORE_PERF_GLOBAL_CTRL, ctrl);
		rdmsrl(MSR_CORE_PERF_GLOBAL_STATUS, status);
		rdmsrl(MSR_CORE_PERF_GLOBAL_OVF_CTRL, overflow);
		rdmsrl(MSR_ARCH_PERFMON_FIXED_CTR_CTRL, fixed);

		pr_info("\n");
		pr_info("CPU#%d: ctrl: %016llx\n", cpu, ctrl);
		pr_info("CPU#%d: status: %016llx\n", cpu, status);
		pr_info("CPU#%d: overflow: %016llx\n", cpu, overflow);
		pr_info("CPU#%d: fixed: %016llx\n", cpu, fixed);
	}
	pr_info("CPU#%d: used: %016llx\n", cpu, *(u64 *)cpuc->used);

	for (idx = 0; idx < x86_pmu.num_counters; idx++) {
		rdmsrl(x86_pmu.eventsel + idx, pmc_ctrl);
		rdmsrl(x86_pmu.perfctr + idx, pmc_count);

		prev_left = per_cpu(prev_left[idx], cpu);

		pr_info("CPU#%d: gen-PMC%d ctrl: %016llx\n",
			cpu, idx, pmc_ctrl);
		pr_info("CPU#%d: gen-PMC%d count: %016llx\n",
			cpu, idx, pmc_count);
		pr_info("CPU#%d: gen-PMC%d left: %016llx\n",
			cpu, idx, prev_left);
	}
	for (idx = 0; idx < x86_pmu.num_counters_fixed; idx++) {
		rdmsrl(MSR_ARCH_PERFMON_FIXED_CTR0 + idx, pmc_count);

		pr_info("CPU#%d: fixed-PMC%d count: %016llx\n",
			cpu, idx, pmc_count);
	}
	local_irq_enable();
}

static void x86_pmu_disable(struct perf_counter *counter)
{
	struct cpu_hw_counters *cpuc = &__get_cpu_var(cpu_hw_counters);
	struct hw_perf_counter *hwc = &counter->hw;
	int idx = hwc->idx;

	/*
	 * Must be done before we disable, otherwise the nmi handler
	 * could reenable again:
	 */
	clear_bit(idx, cpuc->active);
	x86_pmu.disable(hwc, idx);

	/*
	 * Make sure the cleared pointer becomes visible before we
	 * (potentially) free the counter:
	 */
	barrier();

	/*
	 * Drain the remaining delta count out of a counter
	 * that we are disabling:
	 */
	x86_perf_counter_update(counter, hwc, idx);
	cpuc->counters[idx] = NULL;
	clear_bit(idx, cpuc->used);
}

/*
 * Save and restart an expired counter. Called by NMI contexts,
 * so it has to be careful about preempting normal counter ops:
 */
static void intel_pmu_save_and_restart(struct perf_counter *counter)
{
	struct hw_perf_counter *hwc = &counter->hw;
	int idx = hwc->idx;

	x86_perf_counter_update(counter, hwc, idx);
	x86_perf_counter_set_period(counter, hwc, idx);

	if (counter->state == PERF_COUNTER_STATE_ACTIVE)
		intel_pmu_enable_counter(hwc, idx);
}

/*
 * Maximum interrupt frequency of 100KHz per CPU
 */
#define PERFMON_MAX_INTERRUPTS (100000/HZ)
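/*
 * For example, with HZ == 1000 this allows up to 100 counter interrupts
 * between two perf_counter_unthrottle() calls (assumed to run once per
 * timer tick), i.e. roughly 100000 interrupts per second per CPU.
 */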

/*
 * This handler is triggered by the local APIC, so the APIC IRQ handling
 * rules apply:
 */
static int intel_pmu_handle_irq(struct pt_regs *regs, int nmi)
{
	int bit, cpu = smp_processor_id();
	u64 ack, status;
	struct cpu_hw_counters *cpuc = &per_cpu(cpu_hw_counters, cpu);
	int ret = 0;

	cpuc->throttle_ctrl = intel_pmu_save_disable_all();

	status = intel_pmu_get_status(cpuc->throttle_ctrl);
	if (!status)
		goto out;

	ret = 1;
again:
	inc_irq_stat(apic_perf_irqs);
	ack = status;
	for_each_bit(bit, (unsigned long *)&status, X86_PMC_IDX_MAX) {
		struct perf_counter *counter = cpuc->counters[bit];

		clear_bit(bit, (unsigned long *) &status);
		if (!test_bit(bit, cpuc->active))
			continue;

		intel_pmu_save_and_restart(counter);
		if (perf_counter_overflow(counter, nmi, regs, 0))
			intel_pmu_disable_counter(&counter->hw, bit);
	}

	intel_pmu_ack_status(ack);

	/*
	 * Repeat if there is more work to be done:
	 */
	status = intel_pmu_get_status(cpuc->throttle_ctrl);
	if (status)
		goto again;
out:
	/*
	 * Restore - do not reenable when global enable is off or throttled:
	 */
	if (++cpuc->interrupts < PERFMON_MAX_INTERRUPTS)
		intel_pmu_restore_all(cpuc->throttle_ctrl);

	return ret;
}
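
/*
 * Note: the nonzero return value is what perf_counter_nmi_handler()
 * below turns into NOTIFY_STOP, so unrelated NMIs still reach other
 * handlers when no counter has overflowed.
 */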

static int amd_pmu_handle_irq(struct pt_regs *regs, int nmi) { return 0; }

void perf_counter_unthrottle(void)
{
	struct cpu_hw_counters *cpuc;

	if (!x86_pmu_initialized())
		return;

	if (!cpu_has(&boot_cpu_data, X86_FEATURE_ARCH_PERFMON))
		return;

	cpuc = &__get_cpu_var(cpu_hw_counters);
	if (cpuc->interrupts >= PERFMON_MAX_INTERRUPTS) {
		if (printk_ratelimit())
			printk(KERN_WARNING "PERFMON: max interrupts exceeded!\n");
		hw_perf_restore(cpuc->throttle_ctrl);
	}
	cpuc->interrupts = 0;
}

void smp_perf_counter_interrupt(struct pt_regs *regs)
{
	irq_enter();
	apic_write(APIC_LVTPC, LOCAL_PERF_VECTOR);
	ack_APIC_irq();
	x86_pmu.handle_irq(regs, 0);
	irq_exit();
}

void smp_perf_pending_interrupt(struct pt_regs *regs)
{
	irq_enter();
	ack_APIC_irq();
	inc_irq_stat(apic_pending_irqs);
	perf_counter_do_pending();
	irq_exit();
}

void set_perf_counter_pending(void)
{
	apic->send_IPI_self(LOCAL_PENDING_VECTOR);
}

void perf_counters_lapic_init(int nmi)
{
	u32 apic_val;

	if (!x86_pmu_initialized())
		return;

	/*
	 * Enable the performance counter vector in the APIC LVT:
	 */
	apic_val = apic_read(APIC_LVTERR);

	apic_write(APIC_LVTERR, apic_val | APIC_LVT_MASKED);
	if (nmi)
		apic_write(APIC_LVTPC, APIC_DM_NMI);
	else
		apic_write(APIC_LVTPC, LOCAL_PERF_VECTOR);
	apic_write(APIC_LVTERR, apic_val);
}

static int __kprobes
perf_counter_nmi_handler(struct notifier_block *self,
			 unsigned long cmd, void *__args)
{
	struct die_args *args = __args;
	struct pt_regs *regs;
	int ret;

	switch (cmd) {
	case DIE_NMI:
	case DIE_NMI_IPI:
		break;

	default:
		return NOTIFY_DONE;
	}

	regs = args->regs;

	apic_write(APIC_LVTPC, APIC_DM_NMI);
	ret = x86_pmu.handle_irq(regs, 1);

	return ret ? NOTIFY_STOP : NOTIFY_OK;
}

static __read_mostly struct notifier_block perf_counter_nmi_notifier = {
	.notifier_call	= perf_counter_nmi_handler,
	.next		= NULL,
	.priority	= 1
};

static struct x86_pmu intel_pmu = {
	.name			= "Intel",
	.handle_irq		= intel_pmu_handle_irq,
	.save_disable_all	= intel_pmu_save_disable_all,
	.restore_all		= intel_pmu_restore_all,
	.enable			= intel_pmu_enable_counter,
	.disable		= intel_pmu_disable_counter,
	.eventsel		= MSR_ARCH_PERFMON_EVENTSEL0,
	.perfctr		= MSR_ARCH_PERFMON_PERFCTR0,
	.event_map		= intel_pmu_event_map,
	.raw_event		= intel_pmu_raw_event,
	.max_events		= ARRAY_SIZE(intel_perfmon_event_map),
};

static struct x86_pmu amd_pmu = {
	.name			= "AMD",
	.handle_irq		= amd_pmu_handle_irq,
	.save_disable_all	= amd_pmu_save_disable_all,
	.restore_all		= amd_pmu_restore_all,
	.enable			= amd_pmu_enable_counter,
	.disable		= amd_pmu_disable_counter,
	.eventsel		= MSR_K7_EVNTSEL0,
	.perfctr		= MSR_K7_PERFCTR0,
	.event_map		= amd_pmu_event_map,
	.raw_event		= amd_pmu_raw_event,
	.max_events		= ARRAY_SIZE(amd_perfmon_event_map),
	.num_counters		= 4,
	.counter_bits		= 48,
	.counter_mask		= (1ULL << 48) - 1,
};

static int intel_pmu_init(void)
{
	union cpuid10_edx edx;
	union cpuid10_eax eax;
	unsigned int unused;
	unsigned int ebx;
	int version;

	if (!cpu_has(&boot_cpu_data, X86_FEATURE_ARCH_PERFMON))
		return -ENODEV;

	/*
	 * Check whether the Architectural PerfMon supports
	 * Branch Misses Retired Event or not.
	 */
	cpuid(10, &eax.full, &ebx, &unused, &edx.full);
	if (eax.split.mask_length <= ARCH_PERFMON_BRANCH_MISSES_RETIRED)
		return -ENODEV;

	version = eax.split.version_id;
	if (version < 2)
		return -ENODEV;

	x86_pmu = intel_pmu;
	x86_pmu.version = version;
	x86_pmu.num_counters = eax.split.num_counters;
	x86_pmu.num_counters_fixed = edx.split.num_counters_fixed;
	x86_pmu.counter_bits = eax.split.bit_width;
	x86_pmu.counter_mask = (1ULL << eax.split.bit_width) - 1;

	return 0;
}
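
/*
 * Illustrative example (exact figures depend on the CPU): a Core 2
 * class machine typically reports version_id 2, two generic counters
 * and a 40-bit counter width in CPUID leaf 0xa, so counter_mask becomes
 * (1ULL << 40) - 1.
 */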

static int amd_pmu_init(void)
{
	x86_pmu = amd_pmu;
	return 0;
}

void __init init_hw_perf_counters(void)
{
	int err;

	switch (boot_cpu_data.x86_vendor) {
	case X86_VENDOR_INTEL:
		err = intel_pmu_init();
		break;
	case X86_VENDOR_AMD:
		err = amd_pmu_init();
		break;
	default:
		return;
	}
	if (err != 0)
		return;

	pr_info("%s Performance Monitoring support detected.\n", x86_pmu.name);
	pr_info("... version: %d\n", x86_pmu.version);
	pr_info("... bit width: %d\n", x86_pmu.counter_bits);

	pr_info("... num counters: %d\n", x86_pmu.num_counters);
	if (x86_pmu.num_counters > X86_PMC_MAX_GENERIC) {
		x86_pmu.num_counters = X86_PMC_MAX_GENERIC;
		WARN(1, KERN_ERR "hw perf counters %d > max(%d), clipping!",
		     x86_pmu.num_counters, X86_PMC_MAX_GENERIC);
	}
	perf_counter_mask = (1 << x86_pmu.num_counters) - 1;
	perf_max_counters = x86_pmu.num_counters;

	pr_info("... value mask: %016Lx\n", x86_pmu.counter_mask);

	if (x86_pmu.num_counters_fixed > X86_PMC_MAX_FIXED) {
		x86_pmu.num_counters_fixed = X86_PMC_MAX_FIXED;
		WARN(1, KERN_ERR "hw perf counters fixed %d > max(%d), clipping!",
		     x86_pmu.num_counters_fixed, X86_PMC_MAX_FIXED);
	}
	pr_info("... fixed counters: %d\n", x86_pmu.num_counters_fixed);

	perf_counter_mask |=
		((1LL << x86_pmu.num_counters_fixed)-1) << X86_PMC_IDX_FIXED;

	pr_info("... counter mask: %016Lx\n", perf_counter_mask);

	perf_counters_lapic_init(0);
	register_die_notifier(&perf_counter_nmi_notifier);
}

static inline void x86_pmu_read(struct perf_counter *counter)
{
	x86_perf_counter_update(counter, &counter->hw, counter->hw.idx);
}

static const struct pmu pmu = {
	.enable		= x86_pmu_enable,
	.disable	= x86_pmu_disable,
	.read		= x86_pmu_read,
};

const struct pmu *hw_perf_counter_init(struct perf_counter *counter)
{
	int err;

	err = __hw_perf_counter_init(counter);
	if (err)
		return ERR_PTR(err);

	return &pmu;
}

/*
 * callchain support
 */

static inline
void callchain_store(struct perf_callchain_entry *entry, unsigned long ip)
{
	if (entry->nr < MAX_STACK_DEPTH)
		entry->ip[entry->nr++] = ip;
}

static DEFINE_PER_CPU(struct perf_callchain_entry, irq_entry);
static DEFINE_PER_CPU(struct perf_callchain_entry, nmi_entry);


static void
backtrace_warning_symbol(void *data, char *msg, unsigned long symbol)
{
	/* Ignore warnings */
}

static void backtrace_warning(void *data, char *msg)
{
	/* Ignore warnings */
}

static int backtrace_stack(void *data, char *name)
{
	/* Don't bother with IRQ stacks for now */
	return -1;
}

static void backtrace_address(void *data, unsigned long addr, int reliable)
{
	struct perf_callchain_entry *entry = data;

	if (reliable)
		callchain_store(entry, addr);
}

static const struct stacktrace_ops backtrace_ops = {
	.warning		= backtrace_warning,
	.warning_symbol		= backtrace_warning_symbol,
	.stack			= backtrace_stack,
	.address		= backtrace_address,
};

static void
perf_callchain_kernel(struct pt_regs *regs, struct perf_callchain_entry *entry)
{
	unsigned long bp;
	char *stack;
	int nr = entry->nr;

	callchain_store(entry, instruction_pointer(regs));

	stack = ((char *)regs + sizeof(struct pt_regs));
#ifdef CONFIG_FRAME_POINTER
	bp = frame_pointer(regs);
#else
	bp = 0;
#endif

	dump_trace(NULL, regs, (void *)stack, bp, &backtrace_ops, entry);

	entry->kernel = entry->nr - nr;
}


struct stack_frame {
	const void __user	*next_fp;
	unsigned long		return_address;
};

static int copy_stack_frame(const void __user *fp, struct stack_frame *frame)
{
	int ret;

	if (!access_ok(VERIFY_READ, fp, sizeof(*frame)))
		return 0;

	ret = 1;
	pagefault_disable();
	if (__copy_from_user_inatomic(frame, fp, sizeof(*frame)))
		ret = 0;
	pagefault_enable();

	return ret;
}

static void
perf_callchain_user(struct pt_regs *regs, struct perf_callchain_entry *entry)
{
	struct stack_frame frame;
	const void __user *fp;
	int nr = entry->nr;

	regs = (struct pt_regs *)current->thread.sp0 - 1;
	fp = (void __user *)regs->bp;

	callchain_store(entry, regs->ip);

	while (entry->nr < MAX_STACK_DEPTH) {
		frame.next_fp = NULL;
		frame.return_address = 0;

		if (!copy_stack_frame(fp, &frame))
			break;

		if ((unsigned long)fp < user_stack_pointer(regs))
			break;

		callchain_store(entry, frame.return_address);
		fp = frame.next_fp;
	}

	entry->user = entry->nr - nr;
}
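
/*
 * Note: this user-space walk follows saved frame pointers, so it only
 * yields useful entries for binaries built with frame pointers (e.g.
 * compiled without -fomit-frame-pointer); otherwise copy_stack_frame()
 * soon hits an invalid next_fp and the loop stops.
 */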

static void
perf_do_callchain(struct pt_regs *regs, struct perf_callchain_entry *entry)
{
	int is_user;

	if (!regs)
		return;

	is_user = user_mode(regs);

	if (!current || current->pid == 0)
		return;

	if (is_user && current->state != TASK_RUNNING)
		return;

	if (!is_user)
		perf_callchain_kernel(regs, entry);

	if (current->mm)
		perf_callchain_user(regs, entry);
}

struct perf_callchain_entry *perf_callchain(struct pt_regs *regs)
{
	struct perf_callchain_entry *entry;

	if (in_nmi())
		entry = &__get_cpu_var(nmi_entry);
	else
		entry = &__get_cpu_var(irq_entry);

	entry->nr = 0;
	entry->hv = 0;
	entry->kernel = 0;
	entry->user = 0;

	perf_do_callchain(regs, entry);

	return entry;
}