blob: e159254fb7cdc7d255c36c653981c223194e3965 [file] [log] [blame]
Paolo Ciarrocchid4413732008-02-19 23:51:27 +01001/*
Robert Richter6852fd92008-07-22 21:09:08 +02002 * @file op_model_amd.c
Barry Kasindorfbd87f1f2007-12-18 18:05:58 +01003 * athlon / K7 / K8 / Family 10h model-specific MSR operations
Linus Torvalds1da177e2005-04-16 15:20:36 -07004 *
Robert Richterae735e92008-12-25 17:26:07 +01005 * @remark Copyright 2002-2009 OProfile authors
Linus Torvalds1da177e2005-04-16 15:20:36 -07006 * @remark Read the file COPYING
7 *
8 * @author John Levon
9 * @author Philippe Elie
10 * @author Graydon Hoare
Robert Richteradf5ec02008-07-22 21:08:48 +020011 * @author Robert Richter <robert.richter@amd.com>
Jason Yeh4d4036e2009-07-08 13:49:38 +020012 * @author Barry Kasindorf <barry.kasindorf@amd.com>
13 * @author Jason Yeh <jason.yeh@amd.com>
14 * @author Suravee Suthikulpanit <suravee.suthikulpanit@amd.com>
Robert Richterae735e92008-12-25 17:26:07 +010015 */
Linus Torvalds1da177e2005-04-16 15:20:36 -070016
17#include <linux/oprofile.h>
Barry Kasindorf56784f12008-07-22 21:08:55 +020018#include <linux/device.h>
19#include <linux/pci.h>
Jason Yeh4d4036e2009-07-08 13:49:38 +020020#include <linux/percpu.h>
Barry Kasindorf56784f12008-07-22 21:08:55 +020021
Linus Torvalds1da177e2005-04-16 15:20:36 -070022#include <asm/ptrace.h>
23#include <asm/msr.h>
Don Zickus3e4ff112006-06-26 13:57:01 +020024#include <asm/nmi.h>
Robert Richter013cfc52010-01-28 18:05:26 +010025#include <asm/apic.h>
Robert Richter64683da2010-02-04 10:57:23 +010026#include <asm/processor.h>
27#include <asm/cpufeature.h>
Paolo Ciarrocchid4413732008-02-19 23:51:27 +010028
Linus Torvalds1da177e2005-04-16 15:20:36 -070029#include "op_x86_model.h"
30#include "op_counter.h"
31
Robert Richter4c168ea2008-09-24 11:08:52 +020032#define NUM_COUNTERS 4
Jason Yeh4d4036e2009-07-08 13:49:38 +020033#ifdef CONFIG_OPROFILE_EVENT_MULTIPLEX
34#define NUM_VIRT_COUNTERS 32
Jason Yeh4d4036e2009-07-08 13:49:38 +020035#else
36#define NUM_VIRT_COUNTERS NUM_COUNTERS
Jason Yeh4d4036e2009-07-08 13:49:38 +020037#endif
38
Robert Richter3370d352009-05-25 15:10:32 +020039#define OP_EVENT_MASK 0x0FFF
Robert Richter42399ad2009-05-25 17:59:06 +020040#define OP_CTR_OVERFLOW (1ULL<<31)
Robert Richter3370d352009-05-25 15:10:32 +020041
42#define MSR_AMD_EVENTSEL_RESERVED ((0xFFFFFCF0ULL<<32)|(1ULL<<21))
Linus Torvalds1da177e2005-04-16 15:20:36 -070043
Jason Yeh4d4036e2009-07-08 13:49:38 +020044static unsigned long reset_value[NUM_VIRT_COUNTERS];
Robert Richter852402c2008-07-22 21:09:06 +020045
Robert Richterc572ae42009-06-03 20:10:39 +020046#define IBS_FETCH_SIZE 6
47#define IBS_OP_SIZE 12
Barry Kasindorf56784f12008-07-22 21:08:55 +020048
Robert Richter64683da2010-02-04 10:57:23 +010049static u32 ibs_caps;
Barry Kasindorf56784f12008-07-22 21:08:55 +020050
51struct op_ibs_config {
52 unsigned long op_enabled;
53 unsigned long fetch_enabled;
54 unsigned long max_cnt_fetch;
55 unsigned long max_cnt_op;
56 unsigned long rand_en;
57 unsigned long dispatched_ops;
58};
59
60static struct op_ibs_config ibs_config;
Robert Richterba520782010-02-23 15:46:49 +010061static u64 ibs_op_ctl;
Paolo Ciarrocchid4413732008-02-19 23:51:27 +010062
Robert Richter64683da2010-02-04 10:57:23 +010063/*
64 * IBS cpuid feature detection
65 */
66
67#define IBS_CPUID_FEATURES 0x8000001b
68
69/*
70 * Same bit mask as for IBS cpuid feature flags (Fn8000_001B_EAX), but
71 * bit 0 is used to indicate the existence of IBS.
72 */
73#define IBS_CAPS_AVAIL (1LL<<0)
Robert Richterba520782010-02-23 15:46:49 +010074#define IBS_CAPS_RDWROPCNT (1LL<<3)
Robert Richter64683da2010-02-04 10:57:23 +010075#define IBS_CAPS_OPCNT (1LL<<4)
76
Robert Richterba520782010-02-23 15:46:49 +010077/*
78 * IBS randomization macros
79 */
80#define IBS_RANDOM_BITS 12
81#define IBS_RANDOM_MASK ((1ULL << IBS_RANDOM_BITS) - 1)
82#define IBS_RANDOM_MAXCNT_OFFSET (1ULL << (IBS_RANDOM_BITS - 5))
83
Robert Richter64683da2010-02-04 10:57:23 +010084static u32 get_ibs_caps(void)
85{
86 u32 ibs_caps;
87 unsigned int max_level;
88
89 if (!boot_cpu_has(X86_FEATURE_IBS))
90 return 0;
91
92 /* check IBS cpuid feature flags */
93 max_level = cpuid_eax(0x80000000);
94 if (max_level < IBS_CPUID_FEATURES)
95 return IBS_CAPS_AVAIL;
96
97 ibs_caps = cpuid_eax(IBS_CPUID_FEATURES);
98 if (!(ibs_caps & IBS_CAPS_AVAIL))
99 /* cpuid flags not valid */
100 return IBS_CAPS_AVAIL;
101
102 return ibs_caps;
103}
104
Suravee Suthikulpanitf125be12010-01-18 11:25:45 -0600105/*
106 * 16-bit Linear Feedback Shift Register (LFSR)
107 *
108 * 16 14 13 11
109 * Feedback polynomial = X + X + X + X + 1
110 */
111static unsigned int lfsr_random(void)
112{
113 static unsigned int lfsr_value = 0xF00D;
114 unsigned int bit;
115
116 /* Compute next bit to shift in */
117 bit = ((lfsr_value >> 0) ^
118 (lfsr_value >> 2) ^
119 (lfsr_value >> 3) ^
120 (lfsr_value >> 5)) & 0x0001;
121
122 /* Advance to next register value */
123 lfsr_value = (lfsr_value >> 1) | (bit << 15);
124
125 return lfsr_value;
126}
127
Robert Richterba520782010-02-23 15:46:49 +0100128/*
129 * IBS software randomization
130 *
131 * The IBS periodic op counter is randomized in software. The lower 12
132 * bits of the 20 bit counter are randomized. IbsOpCurCnt is
133 * initialized with a 12 bit random value.
134 */
135static inline u64 op_amd_randomize_ibs_op(u64 val)
136{
137 unsigned int random = lfsr_random();
138
139 if (!(ibs_caps & IBS_CAPS_RDWROPCNT))
140 /*
141 * Work around if the hw can not write to IbsOpCurCnt
142 *
143 * Randomize the lower 8 bits of the 16 bit
144 * IbsOpMaxCnt [15:0] value in the range of -128 to
145 * +127 by adding/subtracting an offset to the
146 * maximum count (IbsOpMaxCnt).
147 *
148 * To avoid over or underflows and protect upper bits
149 * starting at bit 16, the initial value for
150 * IbsOpMaxCnt must fit in the range from 0x0081 to
151 * 0xff80.
152 */
153 val += (s8)(random >> 4);
154 else
155 val |= (u64)(random & IBS_RANDOM_MASK) << 32;
156
157 return val;
158}
159
Andrew Morton4680e642009-06-23 12:36:08 -0700160static inline void
Robert Richter7939d2b2008-07-22 21:08:56 +0200161op_amd_handle_ibs(struct pt_regs * const regs,
162 struct op_msrs const * const msrs)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700163{
Robert Richterc572ae42009-06-03 20:10:39 +0200164 u64 val, ctl;
Robert Richter1acda872009-01-05 10:35:31 +0100165 struct op_entry entry;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700166
Robert Richter64683da2010-02-04 10:57:23 +0100167 if (!ibs_caps)
Andrew Morton4680e642009-06-23 12:36:08 -0700168 return;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700169
Robert Richter7939d2b2008-07-22 21:08:56 +0200170 if (ibs_config.fetch_enabled) {
Robert Richterc572ae42009-06-03 20:10:39 +0200171 rdmsrl(MSR_AMD64_IBSFETCHCTL, ctl);
172 if (ctl & IBS_FETCH_VAL) {
173 rdmsrl(MSR_AMD64_IBSFETCHLINAD, val);
174 oprofile_write_reserve(&entry, regs, val,
Robert Richter14f0ca82009-01-07 21:50:22 +0100175 IBS_FETCH_CODE, IBS_FETCH_SIZE);
Robert Richter51563a02009-06-03 20:54:56 +0200176 oprofile_add_data64(&entry, val);
177 oprofile_add_data64(&entry, ctl);
Robert Richterc572ae42009-06-03 20:10:39 +0200178 rdmsrl(MSR_AMD64_IBSFETCHPHYSAD, val);
Robert Richter51563a02009-06-03 20:54:56 +0200179 oprofile_add_data64(&entry, val);
Robert Richter14f0ca82009-01-07 21:50:22 +0100180 oprofile_write_commit(&entry);
Barry Kasindorf56784f12008-07-22 21:08:55 +0200181
Robert Richterfd13f6c2008-10-19 21:00:09 +0200182 /* reenable the IRQ */
Robert Richtera163b102010-02-25 19:43:07 +0100183 ctl &= ~(IBS_FETCH_VAL | IBS_FETCH_CNT);
Robert Richterc572ae42009-06-03 20:10:39 +0200184 ctl |= IBS_FETCH_ENABLE;
185 wrmsrl(MSR_AMD64_IBSFETCHCTL, ctl);
Barry Kasindorf56784f12008-07-22 21:08:55 +0200186 }
187 }
188
Robert Richter7939d2b2008-07-22 21:08:56 +0200189 if (ibs_config.op_enabled) {
Robert Richterc572ae42009-06-03 20:10:39 +0200190 rdmsrl(MSR_AMD64_IBSOPCTL, ctl);
191 if (ctl & IBS_OP_VAL) {
192 rdmsrl(MSR_AMD64_IBSOPRIP, val);
193 oprofile_write_reserve(&entry, regs, val,
Robert Richter14f0ca82009-01-07 21:50:22 +0100194 IBS_OP_CODE, IBS_OP_SIZE);
Robert Richter51563a02009-06-03 20:54:56 +0200195 oprofile_add_data64(&entry, val);
Robert Richterc572ae42009-06-03 20:10:39 +0200196 rdmsrl(MSR_AMD64_IBSOPDATA, val);
Robert Richter51563a02009-06-03 20:54:56 +0200197 oprofile_add_data64(&entry, val);
Robert Richterc572ae42009-06-03 20:10:39 +0200198 rdmsrl(MSR_AMD64_IBSOPDATA2, val);
Robert Richter51563a02009-06-03 20:54:56 +0200199 oprofile_add_data64(&entry, val);
Robert Richterc572ae42009-06-03 20:10:39 +0200200 rdmsrl(MSR_AMD64_IBSOPDATA3, val);
Robert Richter51563a02009-06-03 20:54:56 +0200201 oprofile_add_data64(&entry, val);
Robert Richterc572ae42009-06-03 20:10:39 +0200202 rdmsrl(MSR_AMD64_IBSDCLINAD, val);
Robert Richter51563a02009-06-03 20:54:56 +0200203 oprofile_add_data64(&entry, val);
Robert Richterc572ae42009-06-03 20:10:39 +0200204 rdmsrl(MSR_AMD64_IBSDCPHYSAD, val);
Robert Richter51563a02009-06-03 20:54:56 +0200205 oprofile_add_data64(&entry, val);
Robert Richter14f0ca82009-01-07 21:50:22 +0100206 oprofile_write_commit(&entry);
Barry Kasindorf56784f12008-07-22 21:08:55 +0200207
208 /* reenable the IRQ */
Robert Richterba520782010-02-23 15:46:49 +0100209 ctl = op_amd_randomize_ibs_op(ibs_op_ctl);
Robert Richterc572ae42009-06-03 20:10:39 +0200210 wrmsrl(MSR_AMD64_IBSOPCTL, ctl);
Barry Kasindorf56784f12008-07-22 21:08:55 +0200211 }
212 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700213}
214
Robert Richter90637592009-03-10 19:15:57 +0100215static inline void op_amd_start_ibs(void)
216{
Robert Richterc572ae42009-06-03 20:10:39 +0200217 u64 val;
Robert Richter64683da2010-02-04 10:57:23 +0100218
219 if (!ibs_caps)
220 return;
221
222 if (ibs_config.fetch_enabled) {
Robert Richtera163b102010-02-25 19:43:07 +0100223 val = (ibs_config.max_cnt_fetch >> 4) & IBS_FETCH_MAX_CNT;
Robert Richterc572ae42009-06-03 20:10:39 +0200224 val |= ibs_config.rand_en ? IBS_FETCH_RAND_EN : 0;
225 val |= IBS_FETCH_ENABLE;
226 wrmsrl(MSR_AMD64_IBSFETCHCTL, val);
Robert Richter90637592009-03-10 19:15:57 +0100227 }
228
Robert Richter64683da2010-02-04 10:57:23 +0100229 if (ibs_config.op_enabled) {
Robert Richterba520782010-02-23 15:46:49 +0100230 ibs_op_ctl = ibs_config.max_cnt_op >> 4;
231 if (!(ibs_caps & IBS_CAPS_RDWROPCNT)) {
232 /*
233 * IbsOpCurCnt not supported. See
234 * op_amd_randomize_ibs_op() for details.
235 */
236 ibs_op_ctl = clamp(ibs_op_ctl, 0x0081ULL, 0xFF80ULL);
237 } else {
238 /*
239 * The start value is randomized with a
240 * positive offset, we need to compensate it
241 * with the half of the randomized range. Also
242 * avoid underflows.
243 */
244 ibs_op_ctl = min(ibs_op_ctl + IBS_RANDOM_MAXCNT_OFFSET,
Robert Richtera163b102010-02-25 19:43:07 +0100245 IBS_OP_MAX_CNT);
Robert Richterba520782010-02-23 15:46:49 +0100246 }
Robert Richter64683da2010-02-04 10:57:23 +0100247 if (ibs_caps & IBS_CAPS_OPCNT && ibs_config.dispatched_ops)
Robert Richterba520782010-02-23 15:46:49 +0100248 ibs_op_ctl |= IBS_OP_CNT_CTL;
249 ibs_op_ctl |= IBS_OP_ENABLE;
250 val = op_amd_randomize_ibs_op(ibs_op_ctl);
Robert Richterc572ae42009-06-03 20:10:39 +0200251 wrmsrl(MSR_AMD64_IBSOPCTL, val);
Robert Richter90637592009-03-10 19:15:57 +0100252 }
253}
254
255static void op_amd_stop_ibs(void)
256{
Robert Richter64683da2010-02-04 10:57:23 +0100257 if (!ibs_caps)
258 return;
259
260 if (ibs_config.fetch_enabled)
Robert Richter90637592009-03-10 19:15:57 +0100261 /* clear max count and enable */
Robert Richterc572ae42009-06-03 20:10:39 +0200262 wrmsrl(MSR_AMD64_IBSFETCHCTL, 0);
Robert Richter90637592009-03-10 19:15:57 +0100263
Robert Richter64683da2010-02-04 10:57:23 +0100264 if (ibs_config.op_enabled)
Robert Richter90637592009-03-10 19:15:57 +0100265 /* clear max count and enable */
Robert Richterc572ae42009-06-03 20:10:39 +0200266 wrmsrl(MSR_AMD64_IBSOPCTL, 0);
Robert Richter90637592009-03-10 19:15:57 +0100267}
268
Robert Richterda759fe2010-02-26 10:54:56 +0100269#ifdef CONFIG_OPROFILE_EVENT_MULTIPLEX
270
271static void op_mux_switch_ctrl(struct op_x86_model_spec const *model,
272 struct op_msrs const * const msrs)
273{
274 u64 val;
275 int i;
276
277 /* enable active counters */
278 for (i = 0; i < NUM_COUNTERS; ++i) {
279 int virt = op_x86_phys_to_virt(i);
280 if (!reset_value[virt])
281 continue;
282 rdmsrl(msrs->controls[i].addr, val);
283 val &= model->reserved;
284 val |= op_x86_get_ctrl(model, &counter_config[virt]);
285 wrmsrl(msrs->controls[i].addr, val);
286 }
287}
288
289#endif
290
291/* functions for op_amd_spec */
292
293static void op_amd_shutdown(struct op_msrs const * const msrs)
294{
295 int i;
296
297 for (i = 0; i < NUM_COUNTERS; ++i) {
298 if (!msrs->counters[i].addr)
299 continue;
300 release_perfctr_nmi(MSR_K7_PERFCTR0 + i);
301 release_evntsel_nmi(MSR_K7_EVNTSEL0 + i);
302 }
303}
304
305static int op_amd_fill_in_addresses(struct op_msrs * const msrs)
306{
307 int i;
308
309 for (i = 0; i < NUM_COUNTERS; i++) {
310 if (!reserve_perfctr_nmi(MSR_K7_PERFCTR0 + i))
311 goto fail;
312 if (!reserve_evntsel_nmi(MSR_K7_EVNTSEL0 + i)) {
313 release_perfctr_nmi(MSR_K7_PERFCTR0 + i);
314 goto fail;
315 }
316 /* both registers must be reserved */
317 msrs->counters[i].addr = MSR_K7_PERFCTR0 + i;
318 msrs->controls[i].addr = MSR_K7_EVNTSEL0 + i;
319 continue;
320 fail:
321 if (!counter_config[i].enabled)
322 continue;
323 op_x86_warn_reserved(i);
324 op_amd_shutdown(msrs);
325 return -EBUSY;
326 }
327
328 return 0;
329}
330
331static void op_amd_setup_ctrs(struct op_x86_model_spec const *model,
332 struct op_msrs const * const msrs)
333{
334 u64 val;
335 int i;
336
337 /* setup reset_value */
338 for (i = 0; i < NUM_VIRT_COUNTERS; ++i) {
339 if (counter_config[i].enabled
340 && msrs->counters[op_x86_virt_to_phys(i)].addr)
341 reset_value[i] = counter_config[i].count;
342 else
343 reset_value[i] = 0;
344 }
345
346 /* clear all counters */
347 for (i = 0; i < NUM_COUNTERS; ++i) {
348 if (!msrs->controls[i].addr)
349 continue;
350 rdmsrl(msrs->controls[i].addr, val);
351 if (val & ARCH_PERFMON_EVENTSEL_ENABLE)
352 op_x86_warn_in_use(i);
353 val &= model->reserved;
354 wrmsrl(msrs->controls[i].addr, val);
355 /*
356 * avoid a false detection of ctr overflows in NMI
357 * handler
358 */
359 wrmsrl(msrs->counters[i].addr, -1LL);
360 }
361
362 /* enable active counters */
363 for (i = 0; i < NUM_COUNTERS; ++i) {
364 int virt = op_x86_phys_to_virt(i);
365 if (!reset_value[virt])
366 continue;
367
368 /* setup counter registers */
369 wrmsrl(msrs->counters[i].addr, -(u64)reset_value[virt]);
370
371 /* setup control registers */
372 rdmsrl(msrs->controls[i].addr, val);
373 val &= model->reserved;
374 val |= op_x86_get_ctrl(model, &counter_config[virt]);
375 wrmsrl(msrs->controls[i].addr, val);
376 }
377}
378
Robert Richter7939d2b2008-07-22 21:08:56 +0200379static int op_amd_check_ctrs(struct pt_regs * const regs,
380 struct op_msrs const * const msrs)
381{
Robert Richter42399ad2009-05-25 17:59:06 +0200382 u64 val;
Robert Richter7939d2b2008-07-22 21:08:56 +0200383 int i;
384
Robert Richter6e63ea42009-07-07 19:25:39 +0200385 for (i = 0; i < NUM_COUNTERS; ++i) {
Robert Richterd8471ad2009-07-16 13:04:43 +0200386 int virt = op_x86_phys_to_virt(i);
387 if (!reset_value[virt])
Robert Richter7939d2b2008-07-22 21:08:56 +0200388 continue;
Robert Richter42399ad2009-05-25 17:59:06 +0200389 rdmsrl(msrs->counters[i].addr, val);
390 /* bit is clear if overflowed: */
391 if (val & OP_CTR_OVERFLOW)
392 continue;
Robert Richterd8471ad2009-07-16 13:04:43 +0200393 oprofile_add_sample(regs, virt);
394 wrmsrl(msrs->counters[i].addr, -(u64)reset_value[virt]);
Robert Richter7939d2b2008-07-22 21:08:56 +0200395 }
396
397 op_amd_handle_ibs(regs, msrs);
398
399 /* See op_model_ppro.c */
400 return 1;
401}
Paolo Ciarrocchid4413732008-02-19 23:51:27 +0100402
Robert Richter6657fe42008-07-22 21:08:50 +0200403static void op_amd_start(struct op_msrs const * const msrs)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700404{
Robert Richterdea37662009-05-25 18:11:52 +0200405 u64 val;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700406 int i;
Jason Yeh4d4036e2009-07-08 13:49:38 +0200407
Robert Richter6e63ea42009-07-07 19:25:39 +0200408 for (i = 0; i < NUM_COUNTERS; ++i) {
Robert Richterd8471ad2009-07-16 13:04:43 +0200409 if (!reset_value[op_x86_phys_to_virt(i)])
410 continue;
411 rdmsrl(msrs->controls[i].addr, val);
Robert Richterbb1165d2010-03-01 14:21:23 +0100412 val |= ARCH_PERFMON_EVENTSEL_ENABLE;
Robert Richterd8471ad2009-07-16 13:04:43 +0200413 wrmsrl(msrs->controls[i].addr, val);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700414 }
Robert Richter852402c2008-07-22 21:09:06 +0200415
Robert Richter90637592009-03-10 19:15:57 +0100416 op_amd_start_ibs();
Linus Torvalds1da177e2005-04-16 15:20:36 -0700417}
418
Robert Richter6657fe42008-07-22 21:08:50 +0200419static void op_amd_stop(struct op_msrs const * const msrs)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700420{
Robert Richterdea37662009-05-25 18:11:52 +0200421 u64 val;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700422 int i;
423
Robert Richterfd13f6c2008-10-19 21:00:09 +0200424 /*
425 * Subtle: stop on all counters to avoid race with setting our
426 * pm callback
427 */
Robert Richter6e63ea42009-07-07 19:25:39 +0200428 for (i = 0; i < NUM_COUNTERS; ++i) {
Robert Richterd8471ad2009-07-16 13:04:43 +0200429 if (!reset_value[op_x86_phys_to_virt(i)])
Don Zickuscb9c4482006-09-26 10:52:26 +0200430 continue;
Robert Richterdea37662009-05-25 18:11:52 +0200431 rdmsrl(msrs->controls[i].addr, val);
Robert Richterbb1165d2010-03-01 14:21:23 +0100432 val &= ~ARCH_PERFMON_EVENTSEL_ENABLE;
Robert Richterdea37662009-05-25 18:11:52 +0200433 wrmsrl(msrs->controls[i].addr, val);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700434 }
Barry Kasindorf56784f12008-07-22 21:08:55 +0200435
Robert Richter90637592009-03-10 19:15:57 +0100436 op_amd_stop_ibs();
Linus Torvalds1da177e2005-04-16 15:20:36 -0700437}
438
Robert Richter7d77f2d2008-07-22 21:08:57 +0200439static u8 ibs_eilvt_off;
440
Barry Kasindorf56784f12008-07-22 21:08:55 +0200441static inline void apic_init_ibs_nmi_per_cpu(void *arg)
442{
Robert Richter7d77f2d2008-07-22 21:08:57 +0200443 ibs_eilvt_off = setup_APIC_eilvt_ibs(0, APIC_EILVT_MSG_NMI, 0);
Barry Kasindorf56784f12008-07-22 21:08:55 +0200444}
445
446static inline void apic_clear_ibs_nmi_per_cpu(void *arg)
447{
448 setup_APIC_eilvt_ibs(0, APIC_EILVT_MSG_FIX, 1);
449}
450
Robert Richterfe615cb2008-11-24 14:58:03 +0100451static int init_ibs_nmi(void)
Robert Richter7d77f2d2008-07-22 21:08:57 +0200452{
453#define IBSCTL_LVTOFFSETVAL (1 << 8)
454#define IBSCTL 0x1cc
455 struct pci_dev *cpu_cfg;
456 int nodes;
457 u32 value = 0;
458
459 /* per CPU setup */
Robert Richterebb535d2008-07-22 21:08:59 +0200460 on_each_cpu(apic_init_ibs_nmi_per_cpu, NULL, 1);
Robert Richter7d77f2d2008-07-22 21:08:57 +0200461
462 nodes = 0;
463 cpu_cfg = NULL;
464 do {
465 cpu_cfg = pci_get_device(PCI_VENDOR_ID_AMD,
466 PCI_DEVICE_ID_AMD_10H_NB_MISC,
467 cpu_cfg);
468 if (!cpu_cfg)
469 break;
470 ++nodes;
471 pci_write_config_dword(cpu_cfg, IBSCTL, ibs_eilvt_off
472 | IBSCTL_LVTOFFSETVAL);
473 pci_read_config_dword(cpu_cfg, IBSCTL, &value);
474 if (value != (ibs_eilvt_off | IBSCTL_LVTOFFSETVAL)) {
Robert Richter83bd9242008-12-15 15:09:50 +0100475 pci_dev_put(cpu_cfg);
Robert Richter7d77f2d2008-07-22 21:08:57 +0200476 printk(KERN_DEBUG "Failed to setup IBS LVT offset, "
477 "IBSCTL = 0x%08x", value);
478 return 1;
479 }
480 } while (1);
481
482 if (!nodes) {
483 printk(KERN_DEBUG "No CPU node configured for IBS");
484 return 1;
485 }
486
Robert Richter7d77f2d2008-07-22 21:08:57 +0200487 return 0;
488}
489
Robert Richterfe615cb2008-11-24 14:58:03 +0100490/* uninitialize the APIC for the IBS interrupts if needed */
491static void clear_ibs_nmi(void)
492{
Robert Richter64683da2010-02-04 10:57:23 +0100493 if (ibs_caps)
Robert Richterfe615cb2008-11-24 14:58:03 +0100494 on_each_cpu(apic_clear_ibs_nmi_per_cpu, NULL, 1);
495}
496
Robert Richterfd13f6c2008-10-19 21:00:09 +0200497/* initialize the APIC for the IBS interrupts if available */
Robert Richterfe615cb2008-11-24 14:58:03 +0100498static void ibs_init(void)
Barry Kasindorf56784f12008-07-22 21:08:55 +0200499{
Robert Richter64683da2010-02-04 10:57:23 +0100500 ibs_caps = get_ibs_caps();
Barry Kasindorf56784f12008-07-22 21:08:55 +0200501
Robert Richter64683da2010-02-04 10:57:23 +0100502 if (!ibs_caps)
Barry Kasindorf56784f12008-07-22 21:08:55 +0200503 return;
504
Robert Richterfe615cb2008-11-24 14:58:03 +0100505 if (init_ibs_nmi()) {
Robert Richter64683da2010-02-04 10:57:23 +0100506 ibs_caps = 0;
Robert Richter852402c2008-07-22 21:09:06 +0200507 return;
508 }
509
Robert Richter64683da2010-02-04 10:57:23 +0100510 printk(KERN_INFO "oprofile: AMD IBS detected (0x%08x)\n",
511 (unsigned)ibs_caps);
Barry Kasindorf56784f12008-07-22 21:08:55 +0200512}
513
Robert Richterfe615cb2008-11-24 14:58:03 +0100514static void ibs_exit(void)
Barry Kasindorf56784f12008-07-22 21:08:55 +0200515{
Robert Richter64683da2010-02-04 10:57:23 +0100516 if (!ibs_caps)
Robert Richterfe615cb2008-11-24 14:58:03 +0100517 return;
518
519 clear_ibs_nmi();
Barry Kasindorf56784f12008-07-22 21:08:55 +0200520}
521
Robert Richter25ad29132008-09-05 17:12:36 +0200522static int (*create_arch_files)(struct super_block *sb, struct dentry *root);
Robert Richter270d3e12008-07-22 21:09:01 +0200523
Robert Richter25ad29132008-09-05 17:12:36 +0200524static int setup_ibs_files(struct super_block *sb, struct dentry *root)
Barry Kasindorf56784f12008-07-22 21:08:55 +0200525{
Barry Kasindorf56784f12008-07-22 21:08:55 +0200526 struct dentry *dir;
Robert Richter270d3e12008-07-22 21:09:01 +0200527 int ret = 0;
528
529 /* architecture specific files */
530 if (create_arch_files)
531 ret = create_arch_files(sb, root);
532
533 if (ret)
534 return ret;
Barry Kasindorf56784f12008-07-22 21:08:55 +0200535
Robert Richter64683da2010-02-04 10:57:23 +0100536 if (!ibs_caps)
Robert Richter270d3e12008-07-22 21:09:01 +0200537 return ret;
538
539 /* model specific files */
Barry Kasindorf56784f12008-07-22 21:08:55 +0200540
541 /* setup some reasonable defaults */
542 ibs_config.max_cnt_fetch = 250000;
543 ibs_config.fetch_enabled = 0;
544 ibs_config.max_cnt_op = 250000;
545 ibs_config.op_enabled = 0;
Robert Richter64683da2010-02-04 10:57:23 +0100546 ibs_config.dispatched_ops = 0;
Robert Richter2d55a472008-07-18 17:56:05 +0200547
548 dir = oprofilefs_mkdir(sb, root, "ibs_fetch");
549 oprofilefs_create_ulong(sb, dir, "enable",
550 &ibs_config.fetch_enabled);
551 oprofilefs_create_ulong(sb, dir, "max_count",
552 &ibs_config.max_cnt_fetch);
Barry Kasindorf56784f12008-07-22 21:08:55 +0200553 oprofilefs_create_ulong(sb, dir, "rand_enable",
554 &ibs_config.rand_en);
Robert Richter2d55a472008-07-18 17:56:05 +0200555
Robert Richterccd755c2008-07-29 16:57:10 +0200556 dir = oprofilefs_mkdir(sb, root, "ibs_op");
Barry Kasindorf56784f12008-07-22 21:08:55 +0200557 oprofilefs_create_ulong(sb, dir, "enable",
Robert Richter2d55a472008-07-18 17:56:05 +0200558 &ibs_config.op_enabled);
Barry Kasindorf56784f12008-07-22 21:08:55 +0200559 oprofilefs_create_ulong(sb, dir, "max_count",
Robert Richter2d55a472008-07-18 17:56:05 +0200560 &ibs_config.max_cnt_op);
Robert Richter64683da2010-02-04 10:57:23 +0100561 if (ibs_caps & IBS_CAPS_OPCNT)
562 oprofilefs_create_ulong(sb, dir, "dispatched_ops",
563 &ibs_config.dispatched_ops);
Robert Richterfc2bd732008-07-22 21:09:00 +0200564
565 return 0;
Barry Kasindorf56784f12008-07-22 21:08:55 +0200566}
567
Robert Richteradf5ec02008-07-22 21:08:48 +0200568static int op_amd_init(struct oprofile_operations *ops)
569{
Robert Richterfe615cb2008-11-24 14:58:03 +0100570 ibs_init();
Robert Richter270d3e12008-07-22 21:09:01 +0200571 create_arch_files = ops->create_files;
572 ops->create_files = setup_ibs_files;
Robert Richteradf5ec02008-07-22 21:08:48 +0200573 return 0;
574}
575
576static void op_amd_exit(void)
577{
Robert Richterfe615cb2008-11-24 14:58:03 +0100578 ibs_exit();
Robert Richteradf5ec02008-07-22 21:08:48 +0200579}
580
Robert Richter259a83a2009-07-09 15:12:35 +0200581struct op_x86_model_spec op_amd_spec = {
Robert Richterc92960f2008-09-05 17:12:36 +0200582 .num_counters = NUM_COUNTERS,
Robert Richterd0e41202010-03-23 19:33:21 +0100583 .num_controls = NUM_COUNTERS,
Jason Yeh4d4036e2009-07-08 13:49:38 +0200584 .num_virt_counters = NUM_VIRT_COUNTERS,
Robert Richter3370d352009-05-25 15:10:32 +0200585 .reserved = MSR_AMD_EVENTSEL_RESERVED,
586 .event_mask = OP_EVENT_MASK,
587 .init = op_amd_init,
588 .exit = op_amd_exit,
Robert Richterc92960f2008-09-05 17:12:36 +0200589 .fill_in_addresses = &op_amd_fill_in_addresses,
590 .setup_ctrs = &op_amd_setup_ctrs,
591 .check_ctrs = &op_amd_check_ctrs,
592 .start = &op_amd_start,
593 .stop = &op_amd_stop,
Robert Richter3370d352009-05-25 15:10:32 +0200594 .shutdown = &op_amd_shutdown,
Jason Yeh4d4036e2009-07-08 13:49:38 +0200595#ifdef CONFIG_OPROFILE_EVENT_MULTIPLEX
Robert Richter7e7478c2009-07-16 13:09:53 +0200596 .switch_ctrl = &op_mux_switch_ctrl,
Jason Yeh4d4036e2009-07-08 13:49:38 +0200597#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -0700598};