blob: d85d1e6b1988875d0874eebb9e77d5c1b382c969 [file] [log] [blame]
/*
 * S390 Version
 *   Copyright IBM Corp. 2002, 2011
 *   Author(s): Thomas Spatzier (tspat@de.ibm.com)
 *   Author(s): Mahesh Salgaonkar (mahesh@linux.vnet.ibm.com)
 *   Author(s): Heinz Graalfs (graalfs@linux.vnet.ibm.com)
 *   Author(s): Andreas Krebbel (krebbel@linux.vnet.ibm.com)
 *
 * @remark Copyright 2002-2011 OProfile authors
 */
11
12#include <linux/oprofile.h>
Hendrik Bruecknere28bb792013-12-12 16:52:48 +010013#include <linux/perf_event.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070014#include <linux/init.h>
15#include <linux/errno.h>
Heinz Graalfsc814d162011-02-15 13:02:14 -050016#include <linux/fs.h>
Andreas Krebbeldd3c4672011-11-25 20:03:05 +010017#include <linux/module.h>
18#include <asm/processor.h>
Sebastian Otta215c8f2015-06-25 14:52:13 +020019#include <asm/perf_event.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070020
Heinz Graalfsc814d162011-02-15 13:02:14 -050021#include "../../../drivers/oprofile/oprof.h"
Heiko Carstens984e8482011-03-23 10:15:00 +010022
Heinz Graalfsc814d162011-02-15 13:02:14 -050023#include "hwsampler.h"
Andreas Krebbeldd3c4672011-11-25 20:03:05 +010024#include "op_counter.h"
Heinz Graalfsc814d162011-02-15 13:02:14 -050025
Christian Borntraeger68158232011-06-22 16:24:09 +020026#define DEFAULT_INTERVAL 4127518
Heinz Graalfsc814d162011-02-15 13:02:14 -050027
28#define DEFAULT_SDBT_BLOCKS 1
29#define DEFAULT_SDB_BLOCKS 511
30
31static unsigned long oprofile_hw_interval = DEFAULT_INTERVAL;
32static unsigned long oprofile_min_interval;
33static unsigned long oprofile_max_interval;
34
35static unsigned long oprofile_sdbt_blocks = DEFAULT_SDBT_BLOCKS;
36static unsigned long oprofile_sdb_blocks = DEFAULT_SDB_BLOCKS;
37
Andreas Krebbeldd3c4672011-11-25 20:03:05 +010038static int hwsampler_enabled;
Heinz Graalfsc814d162011-02-15 13:02:14 -050039static int hwsampler_running; /* start_mutex must be held to change */
Andreas Krebbeldd3c4672011-11-25 20:03:05 +010040static int hwsampler_available;
Heinz Graalfsc814d162011-02-15 13:02:14 -050041
42static struct oprofile_operations timer_ops;
Andreas Krebbeld0f4c162006-01-06 00:19:16 -080043
Andreas Krebbeldd3c4672011-11-25 20:03:05 +010044struct op_counter_config counter_config;
45
46enum __force_cpu_type {
47 reserved = 0, /* do not force */
48 timer,
49};
50static int force_cpu_type;
51
52static int set_cpu_type(const char *str, struct kernel_param *kp)
53{
54 if (!strcmp(str, "timer")) {
55 force_cpu_type = timer;
56 printk(KERN_INFO "oprofile: forcing timer to be returned "
57 "as cpu type\n");
58 } else {
59 force_cpu_type = 0;
60 }
61
62 return 0;
63}
64module_param_call(cpu_type, set_cpu_type, NULL, NULL, 0);
65MODULE_PARM_DESC(cpu_type, "Force legacy basic mode sampling"
66 "(report cpu_type \"timer\"");
67
Hendrik Bruecknere28bb792013-12-12 16:52:48 +010068static int __oprofile_hwsampler_start(void)
69{
70 int retval;
71
72 retval = hwsampler_allocate(oprofile_sdbt_blocks, oprofile_sdb_blocks);
73 if (retval)
74 return retval;
75
76 retval = hwsampler_start_all(oprofile_hw_interval);
77 if (retval)
78 hwsampler_deallocate();
79
80 return retval;
81}
82
Heinz Graalfsc814d162011-02-15 13:02:14 -050083static int oprofile_hwsampler_start(void)
84{
85 int retval;
86
Andreas Krebbeldd3c4672011-11-25 20:03:05 +010087 hwsampler_running = hwsampler_enabled;
Heinz Graalfsc814d162011-02-15 13:02:14 -050088
89 if (!hwsampler_running)
90 return timer_ops.start();
91
Hendrik Bruecknere28bb792013-12-12 16:52:48 +010092 retval = perf_reserve_sampling();
Heinz Graalfsc814d162011-02-15 13:02:14 -050093 if (retval)
94 return retval;
95
Hendrik Bruecknere28bb792013-12-12 16:52:48 +010096 retval = __oprofile_hwsampler_start();
Heinz Graalfsc814d162011-02-15 13:02:14 -050097 if (retval)
Hendrik Bruecknere28bb792013-12-12 16:52:48 +010098 perf_release_sampling();
Heinz Graalfsc814d162011-02-15 13:02:14 -050099
100 return retval;
101}
102
103static void oprofile_hwsampler_stop(void)
104{
105 if (!hwsampler_running) {
106 timer_ops.stop();
107 return;
108 }
109
110 hwsampler_stop_all();
111 hwsampler_deallocate();
Hendrik Bruecknere28bb792013-12-12 16:52:48 +0100112 perf_release_sampling();
Heinz Graalfsc814d162011-02-15 13:02:14 -0500113 return;
114}
115
Andreas Krebbeldd3c4672011-11-25 20:03:05 +0100116/*
117 * File ops used for:
118 * /dev/oprofile/0/enabled
119 * /dev/oprofile/hwsampling/hwsampler (cpu_type = timer)
120 */
121
Heinz Graalfsc814d162011-02-15 13:02:14 -0500122static ssize_t hwsampler_read(struct file *file, char __user *buf,
123 size_t count, loff_t *offset)
124{
Andreas Krebbeldd3c4672011-11-25 20:03:05 +0100125 return oprofilefs_ulong_to_user(hwsampler_enabled, buf, count, offset);
Heinz Graalfsc814d162011-02-15 13:02:14 -0500126}
127
128static ssize_t hwsampler_write(struct file *file, char const __user *buf,
129 size_t count, loff_t *offset)
130{
131 unsigned long val;
132 int retval;
133
134 if (*offset)
135 return -EINVAL;
136
137 retval = oprofilefs_ulong_from_user(&val, buf, count);
Robert Richter913050b2011-12-19 16:38:30 +0100138 if (retval <= 0)
Heinz Graalfsc814d162011-02-15 13:02:14 -0500139 return retval;
140
Andreas Krebbeldd3c4672011-11-25 20:03:05 +0100141 if (val != 0 && val != 1)
142 return -EINVAL;
143
Heinz Graalfsc814d162011-02-15 13:02:14 -0500144 if (oprofile_started)
145 /*
146 * save to do without locking as we set
147 * hwsampler_running in start() when start_mutex is
148 * held
149 */
150 return -EBUSY;
151
Andreas Krebbeldd3c4672011-11-25 20:03:05 +0100152 hwsampler_enabled = val;
Heinz Graalfsc814d162011-02-15 13:02:14 -0500153
154 return count;
155}
156
157static const struct file_operations hwsampler_fops = {
158 .read = hwsampler_read,
159 .write = hwsampler_write,
160};
161
Andreas Krebbeldd3c4672011-11-25 20:03:05 +0100162/*
163 * File ops used for:
164 * /dev/oprofile/0/count
165 * /dev/oprofile/hwsampling/hw_interval (cpu_type = timer)
166 *
167 * Make sure that the value is within the hardware range.
168 */
169
170static ssize_t hw_interval_read(struct file *file, char __user *buf,
171 size_t count, loff_t *offset)
Heinz Graalfsc814d162011-02-15 13:02:14 -0500172{
Andreas Krebbeldd3c4672011-11-25 20:03:05 +0100173 return oprofilefs_ulong_to_user(oprofile_hw_interval, buf,
174 count, offset);
175}
Heinz Graalfsc814d162011-02-15 13:02:14 -0500176
Andreas Krebbeldd3c4672011-11-25 20:03:05 +0100177static ssize_t hw_interval_write(struct file *file, char const __user *buf,
178 size_t count, loff_t *offset)
179{
180 unsigned long val;
181 int retval;
Heinz Graalfsc814d162011-02-15 13:02:14 -0500182
Andreas Krebbeldd3c4672011-11-25 20:03:05 +0100183 if (*offset)
184 return -EINVAL;
185 retval = oprofilefs_ulong_from_user(&val, buf, count);
Robert Richter81ff3472012-07-19 18:28:26 +0200186 if (retval <= 0)
Andreas Krebbeldd3c4672011-11-25 20:03:05 +0100187 return retval;
188 if (val < oprofile_min_interval)
189 oprofile_hw_interval = oprofile_min_interval;
190 else if (val > oprofile_max_interval)
191 oprofile_hw_interval = oprofile_max_interval;
192 else
193 oprofile_hw_interval = val;
194
195 return count;
196}
197
198static const struct file_operations hw_interval_fops = {
199 .read = hw_interval_read,
200 .write = hw_interval_write,
201};
202
203/*
204 * File ops used for:
205 * /dev/oprofile/0/event
206 * Only a single event with number 0 is supported with this counter.
207 *
208 * /dev/oprofile/0/unit_mask
209 * This is a dummy file needed by the user space tools.
210 * No value other than 0 is accepted or returned.
211 */
212
213static ssize_t hwsampler_zero_read(struct file *file, char __user *buf,
214 size_t count, loff_t *offset)
215{
216 return oprofilefs_ulong_to_user(0, buf, count, offset);
217}
218
219static ssize_t hwsampler_zero_write(struct file *file, char const __user *buf,
220 size_t count, loff_t *offset)
221{
222 unsigned long val;
223 int retval;
224
225 if (*offset)
Heinz Graalfsc814d162011-02-15 13:02:14 -0500226 return -EINVAL;
227
Andreas Krebbeldd3c4672011-11-25 20:03:05 +0100228 retval = oprofilefs_ulong_from_user(&val, buf, count);
Robert Richter81ff3472012-07-19 18:28:26 +0200229 if (retval <= 0)
Andreas Krebbeldd3c4672011-11-25 20:03:05 +0100230 return retval;
231 if (val != 0)
232 return -EINVAL;
233 return count;
234}
Heinz Graalfsc814d162011-02-15 13:02:14 -0500235
Andreas Krebbeldd3c4672011-11-25 20:03:05 +0100236static const struct file_operations zero_fops = {
237 .read = hwsampler_zero_read,
238 .write = hwsampler_zero_write,
239};
240
241/* /dev/oprofile/0/kernel file ops. */
242
243static ssize_t hwsampler_kernel_read(struct file *file, char __user *buf,
244 size_t count, loff_t *offset)
245{
246 return oprofilefs_ulong_to_user(counter_config.kernel,
247 buf, count, offset);
248}
249
250static ssize_t hwsampler_kernel_write(struct file *file, char const __user *buf,
251 size_t count, loff_t *offset)
252{
253 unsigned long val;
254 int retval;
255
256 if (*offset)
257 return -EINVAL;
258
259 retval = oprofilefs_ulong_from_user(&val, buf, count);
Robert Richter81ff3472012-07-19 18:28:26 +0200260 if (retval <= 0)
Andreas Krebbeldd3c4672011-11-25 20:03:05 +0100261 return retval;
262
263 if (val != 0 && val != 1)
264 return -EINVAL;
265
266 counter_config.kernel = val;
267
268 return count;
269}
270
271static const struct file_operations kernel_fops = {
272 .read = hwsampler_kernel_read,
273 .write = hwsampler_kernel_write,
274};
275
276/* /dev/oprofile/0/user file ops. */
277
278static ssize_t hwsampler_user_read(struct file *file, char __user *buf,
279 size_t count, loff_t *offset)
280{
281 return oprofilefs_ulong_to_user(counter_config.user,
282 buf, count, offset);
283}
284
285static ssize_t hwsampler_user_write(struct file *file, char const __user *buf,
286 size_t count, loff_t *offset)
287{
288 unsigned long val;
289 int retval;
290
291 if (*offset)
292 return -EINVAL;
293
294 retval = oprofilefs_ulong_from_user(&val, buf, count);
Robert Richter81ff3472012-07-19 18:28:26 +0200295 if (retval <= 0)
Andreas Krebbeldd3c4672011-11-25 20:03:05 +0100296 return retval;
297
298 if (val != 0 && val != 1)
299 return -EINVAL;
300
301 counter_config.user = val;
302
303 return count;
304}
305
306static const struct file_operations user_fops = {
307 .read = hwsampler_user_read,
308 .write = hwsampler_user_write,
309};
310
311
312/*
313 * File ops used for: /dev/oprofile/timer/enabled
314 * The value always has to be the inverted value of hwsampler_enabled. So
315 * no separate variable is created. That way we do not need locking.
316 */
317
318static ssize_t timer_enabled_read(struct file *file, char __user *buf,
319 size_t count, loff_t *offset)
320{
321 return oprofilefs_ulong_to_user(!hwsampler_enabled, buf, count, offset);
322}
323
324static ssize_t timer_enabled_write(struct file *file, char const __user *buf,
325 size_t count, loff_t *offset)
326{
327 unsigned long val;
328 int retval;
329
330 if (*offset)
331 return -EINVAL;
332
333 retval = oprofilefs_ulong_from_user(&val, buf, count);
Robert Richter81ff3472012-07-19 18:28:26 +0200334 if (retval <= 0)
Andreas Krebbeldd3c4672011-11-25 20:03:05 +0100335 return retval;
336
337 if (val != 0 && val != 1)
338 return -EINVAL;
339
340 /* Timer cannot be disabled without having hardware sampling. */
341 if (val == 0 && !hwsampler_available)
342 return -EINVAL;
343
344 if (oprofile_started)
345 /*
346 * save to do without locking as we set
347 * hwsampler_running in start() when start_mutex is
348 * held
349 */
350 return -EBUSY;
351
352 hwsampler_enabled = !val;
353
354 return count;
355}
356
357static const struct file_operations timer_enabled_fops = {
358 .read = timer_enabled_read,
359 .write = timer_enabled_write,
360};
361
362
Al Viroef7bca12013-07-19 15:52:42 +0400363static int oprofile_create_hwsampling_files(struct dentry *root)
Andreas Krebbeldd3c4672011-11-25 20:03:05 +0100364{
365 struct dentry *dir;
366
Al Viroecde2822013-07-19 15:58:27 +0400367 dir = oprofilefs_mkdir(root, "timer");
Andreas Krebbeldd3c4672011-11-25 20:03:05 +0100368 if (!dir)
369 return -EINVAL;
370
Al Viro6af4ea02013-07-19 16:10:36 +0400371 oprofilefs_create_file(dir, "enabled", &timer_enabled_fops);
Andreas Krebbeldd3c4672011-11-25 20:03:05 +0100372
373 if (!hwsampler_available)
374 return 0;
375
376 /* reinitialize default values */
377 hwsampler_enabled = 1;
378 counter_config.kernel = 1;
379 counter_config.user = 1;
380
381 if (!force_cpu_type) {
382 /*
383 * Create the counter file system. A single virtual
384 * counter is created which can be used to
385 * enable/disable hardware sampling dynamically from
386 * user space. The user space will configure a single
387 * counter with a single event. The value of 'event'
388 * and 'unit_mask' are not evaluated by the kernel code
389 * and can only be set to 0.
390 */
391
Al Viroecde2822013-07-19 15:58:27 +0400392 dir = oprofilefs_mkdir(root, "0");
Andreas Krebbeldd3c4672011-11-25 20:03:05 +0100393 if (!dir)
394 return -EINVAL;
395
Al Viro6af4ea02013-07-19 16:10:36 +0400396 oprofilefs_create_file(dir, "enabled", &hwsampler_fops);
397 oprofilefs_create_file(dir, "event", &zero_fops);
398 oprofilefs_create_file(dir, "count", &hw_interval_fops);
399 oprofilefs_create_file(dir, "unit_mask", &zero_fops);
400 oprofilefs_create_file(dir, "kernel", &kernel_fops);
401 oprofilefs_create_file(dir, "user", &user_fops);
402 oprofilefs_create_ulong(dir, "hw_sdbt_blocks",
Andreas Krebbeldd3c4672011-11-25 20:03:05 +0100403 &oprofile_sdbt_blocks);
404
405 } else {
406 /*
407 * Hardware sampling can be used but the cpu_type is
408 * forced to timer in order to deal with legacy user
409 * space tools. The /dev/oprofile/hwsampling fs is
410 * provided in that case.
411 */
Al Viroecde2822013-07-19 15:58:27 +0400412 dir = oprofilefs_mkdir(root, "hwsampling");
Andreas Krebbeldd3c4672011-11-25 20:03:05 +0100413 if (!dir)
414 return -EINVAL;
415
Al Viro6af4ea02013-07-19 16:10:36 +0400416 oprofilefs_create_file(dir, "hwsampler",
Andreas Krebbeldd3c4672011-11-25 20:03:05 +0100417 &hwsampler_fops);
Al Viro6af4ea02013-07-19 16:10:36 +0400418 oprofilefs_create_file(dir, "hw_interval",
Andreas Krebbeldd3c4672011-11-25 20:03:05 +0100419 &hw_interval_fops);
Al Viro6af4ea02013-07-19 16:10:36 +0400420 oprofilefs_create_ro_ulong(dir, "hw_min_interval",
Andreas Krebbeldd3c4672011-11-25 20:03:05 +0100421 &oprofile_min_interval);
Al Viro6af4ea02013-07-19 16:10:36 +0400422 oprofilefs_create_ro_ulong(dir, "hw_max_interval",
Andreas Krebbeldd3c4672011-11-25 20:03:05 +0100423 &oprofile_max_interval);
Al Viro6af4ea02013-07-19 16:10:36 +0400424 oprofilefs_create_ulong(dir, "hw_sdbt_blocks",
Andreas Krebbeldd3c4672011-11-25 20:03:05 +0100425 &oprofile_sdbt_blocks);
426 }
Heinz Graalfsc814d162011-02-15 13:02:14 -0500427 return 0;
428}
429
Robert Richterec6b4262011-03-16 12:10:12 +0100430static int oprofile_hwsampler_init(struct oprofile_operations *ops)
Heinz Graalfsc814d162011-02-15 13:02:14 -0500431{
Andreas Krebbeldd3c4672011-11-25 20:03:05 +0100432 /*
433 * Initialize the timer mode infrastructure as well in order
434 * to be able to switch back dynamically. oprofile_timer_init
435 * is not supposed to fail.
436 */
437 if (oprofile_timer_init(ops))
438 BUG();
439
440 memcpy(&timer_ops, ops, sizeof(timer_ops));
441 ops->create_files = oprofile_create_hwsampling_files;
442
443 /*
444 * If the user space tools do not support newer cpu types,
445 * the force_cpu_type module parameter
446 * can be used to always return \"timer\" as cpu type.
447 */
448 if (force_cpu_type != timer) {
449 struct cpuid id;
450
451 get_cpu_id (&id);
452
453 switch (id.machine) {
454 case 0x2097: case 0x2098: ops->cpu_type = "s390/z10"; break;
455 case 0x2817: case 0x2818: ops->cpu_type = "s390/z196"; break;
Heiko Carstens59471222013-07-24 10:35:33 +0200456 case 0x2827: case 0x2828: ops->cpu_type = "s390/zEC12"; break;
Andreas Krebbeldd3c4672011-11-25 20:03:05 +0100457 default: return -ENODEV;
458 }
459 }
460
Heinz Graalfsc814d162011-02-15 13:02:14 -0500461 if (hwsampler_setup())
462 return -ENODEV;
463
464 /*
Andreas Krebbeldd3c4672011-11-25 20:03:05 +0100465 * Query the range for the sampling interval from the
466 * hardware.
Heinz Graalfsc814d162011-02-15 13:02:14 -0500467 */
468 oprofile_min_interval = hwsampler_query_min_interval();
Martin Schwidefsky3d8dcb32011-05-10 17:13:42 +0200469 if (oprofile_min_interval == 0)
Heinz Graalfsc814d162011-02-15 13:02:14 -0500470 return -ENODEV;
Heinz Graalfsc814d162011-02-15 13:02:14 -0500471 oprofile_max_interval = hwsampler_query_max_interval();
Martin Schwidefsky3d8dcb32011-05-10 17:13:42 +0200472 if (oprofile_max_interval == 0)
Heinz Graalfsc814d162011-02-15 13:02:14 -0500473 return -ENODEV;
Heinz Graalfsc814d162011-02-15 13:02:14 -0500474
Christian Borntraegerb530ce72011-06-22 16:24:08 +0200475 /* The initial value should be sane */
476 if (oprofile_hw_interval < oprofile_min_interval)
477 oprofile_hw_interval = oprofile_min_interval;
478 if (oprofile_hw_interval > oprofile_max_interval)
479 oprofile_hw_interval = oprofile_max_interval;
480
Andreas Krebbeldd3c4672011-11-25 20:03:05 +0100481 printk(KERN_INFO "oprofile: System z hardware sampling "
482 "facility found.\n");
Heinz Graalfsc814d162011-02-15 13:02:14 -0500483
484 ops->start = oprofile_hwsampler_start;
485 ops->stop = oprofile_hwsampler_stop;
Heinz Graalfsc814d162011-02-15 13:02:14 -0500486
487 return 0;
488}
489
/* Tear down the hardware sampler by delegating to hwsampler_shutdown(). */
static void oprofile_hwsampler_exit(void)
{
	hwsampler_shutdown();
}
494
/*
 * Per-address callback handed to dump_trace().
 *
 * @data points to an unsigned int holding the number of entries that may
 * still be recorded. While that budget is non-zero it is decremented, the
 * address is recorded via oprofile_add_trace() and 0 is returned; once it
 * is exhausted 1 is returned (presumably telling dump_trace() to stop -
 * confirm against dump_trace()).
 */
static int __s390_backtrace(void *data, unsigned long address)
{
	unsigned int *remaining = data;

	if (!*remaining)
		return 1;

	--*remaining;
	oprofile_add_trace(address);

	return 0;
}
505
506static void s390_backtrace(struct pt_regs *regs, unsigned int depth)
507{
508 if (user_mode(regs))
509 return;
510 dump_trace(__s390_backtrace, &depth, NULL, regs->gprs[15]);
511}
512
Robert Richterec6b4262011-03-16 12:10:12 +0100513int __init oprofile_arch_init(struct oprofile_operations *ops)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700514{
Andreas Krebbeld0f4c162006-01-06 00:19:16 -0800515 ops->backtrace = s390_backtrace;
Heinz Graalfs997dbb42011-01-21 10:06:53 +0000516
Andreas Krebbeldd3c4672011-11-25 20:03:05 +0100517 /*
518 * -ENODEV is not reported to the caller. The module itself
519 * will use the timer mode sampling as fallback and this is
520 * always available.
521 */
522 hwsampler_available = oprofile_hwsampler_init(ops) == 0;
523
524 return 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700525}
526
/*
 * Architecture exit hook for oprofile. The hardware sampler teardown is
 * called unconditionally, whether or not initialization succeeded.
 */
void oprofile_arch_exit(void)
{
	oprofile_hwsampler_exit();
}