blob: 0cb385da202c60836fd2cd006e5950ed448de656 [file] [log] [blame]
Heiko Carstensa53c8fa2012-07-20 11:15:04 +02001/*
Heinz Graalfsec6a3df2011-01-21 10:06:52 +00002 * Copyright IBM Corp. 2010
3 * Author: Heinz Graalfs <graalfs@de.ibm.com>
4 */
5
Heiko Carstensfcdd65b2011-05-23 10:24:48 +02006#include <linux/kernel_stat.h>
Heinz Graalfsec6a3df2011-01-21 10:06:52 +00007#include <linux/kernel.h>
8#include <linux/module.h>
9#include <linux/smp.h>
10#include <linux/errno.h>
11#include <linux/workqueue.h>
12#include <linux/interrupt.h>
13#include <linux/notifier.h>
14#include <linux/cpu.h>
15#include <linux/semaphore.h>
16#include <linux/oom.h>
17#include <linux/oprofile.h>
18
David Howellsa0616cd2012-03-28 18:30:02 +010019#include <asm/facility.h>
Jan Glauberb03d541a2012-03-23 11:13:05 +010020#include <asm/cpu_mf.h>
Heiko Carstensd7b250e2011-05-26 09:48:24 +020021#include <asm/irq.h>
Heinz Graalfsec6a3df2011-01-21 10:06:52 +000022
23#include "hwsampler.h"
Andreas Krebbeldd3c4672011-11-25 20:03:05 +010024#include "op_counter.h"
Heinz Graalfsec6a3df2011-01-21 10:06:52 +000025
26#define MAX_NUM_SDB 511
27#define MIN_NUM_SDB 1
28
29#define ALERT_REQ_MASK 0x4000000000000000ul
30#define BUFFER_FULL_MASK 0x8000000000000000ul
31
Heinz Graalfsec6a3df2011-01-21 10:06:52 +000032DECLARE_PER_CPU(struct hws_cpu_buffer, sampler_cpu_buffer);
33
34struct hws_execute_parms {
35 void *buffer;
36 signed int rc;
37};
38
39DEFINE_PER_CPU(struct hws_cpu_buffer, sampler_cpu_buffer);
40EXPORT_PER_CPU_SYMBOL(sampler_cpu_buffer);
41
42static DEFINE_MUTEX(hws_sem);
43static DEFINE_MUTEX(hws_sem_oom);
44
45static unsigned char hws_flush_all;
46static unsigned int hws_oom;
47static struct workqueue_struct *hws_wq;
48
49static unsigned int hws_state;
50enum {
51 HWS_INIT = 1,
52 HWS_DEALLOCATED,
53 HWS_STOPPED,
54 HWS_STARTED,
55 HWS_STOPPING };
56
57/* set to 1 if called by kernel during memory allocation */
58static unsigned char oom_killer_was_active;
59/* size of SDBT and SDB as of allocate API */
60static unsigned long num_sdbt = 100;
61static unsigned long num_sdb = 511;
62/* sampling interval (machine cycles) */
63static unsigned long interval;
64
65static unsigned long min_sampler_rate;
66static unsigned long max_sampler_rate;
67
68static int ssctl(void *buffer)
69{
70 int cc;
71
72 /* set in order to detect a program check */
73 cc = 1;
74
75 asm volatile(
76 "0: .insn s,0xB2870000,0(%1)\n"
77 "1: ipm %0\n"
78 " srl %0,28\n"
79 "2:\n"
80 EX_TABLE(0b, 2b) EX_TABLE(1b, 2b)
81 : "+d" (cc), "+a" (buffer)
82 : "m" (*((struct hws_ssctl_request_block *)buffer))
83 : "cc", "memory");
84
85 return cc ? -EINVAL : 0 ;
86}
87
88static int qsi(void *buffer)
89{
90 int cc;
91 cc = 1;
92
93 asm volatile(
94 "0: .insn s,0xB2860000,0(%1)\n"
95 "1: lhi %0,0\n"
96 "2:\n"
97 EX_TABLE(0b, 2b) EX_TABLE(1b, 2b)
98 : "=d" (cc), "+a" (buffer)
99 : "m" (*((struct hws_qsi_info_block *)buffer))
100 : "cc", "memory");
101
102 return cc ? -EINVAL : 0;
103}
104
105static void execute_qsi(void *parms)
106{
107 struct hws_execute_parms *ep = parms;
108
109 ep->rc = qsi(ep->buffer);
110}
111
112static void execute_ssctl(void *parms)
113{
114 struct hws_execute_parms *ep = parms;
115
116 ep->rc = ssctl(ep->buffer);
117}
118
119static int smp_ctl_ssctl_stop(int cpu)
120{
121 int rc;
122 struct hws_execute_parms ep;
123 struct hws_cpu_buffer *cb;
124
125 cb = &per_cpu(sampler_cpu_buffer, cpu);
126
127 cb->ssctl.es = 0;
128 cb->ssctl.cs = 0;
129
130 ep.buffer = &cb->ssctl;
131 smp_call_function_single(cpu, execute_ssctl, &ep, 1);
132 rc = ep.rc;
133 if (rc) {
134 printk(KERN_ERR "hwsampler: CPU %d CPUMF SSCTL failed.\n", cpu);
135 dump_stack();
136 }
137
138 ep.buffer = &cb->qsi;
139 smp_call_function_single(cpu, execute_qsi, &ep, 1);
140
141 if (cb->qsi.es || cb->qsi.cs) {
142 printk(KERN_EMERG "CPUMF sampling did not stop properly.\n");
143 dump_stack();
144 }
145
146 return rc;
147}
148
149static int smp_ctl_ssctl_deactivate(int cpu)
150{
151 int rc;
152 struct hws_execute_parms ep;
153 struct hws_cpu_buffer *cb;
154
155 cb = &per_cpu(sampler_cpu_buffer, cpu);
156
157 cb->ssctl.es = 1;
158 cb->ssctl.cs = 0;
159
160 ep.buffer = &cb->ssctl;
161 smp_call_function_single(cpu, execute_ssctl, &ep, 1);
162 rc = ep.rc;
163 if (rc)
164 printk(KERN_ERR "hwsampler: CPU %d CPUMF SSCTL failed.\n", cpu);
165
166 ep.buffer = &cb->qsi;
167 smp_call_function_single(cpu, execute_qsi, &ep, 1);
168
169 if (cb->qsi.cs)
170 printk(KERN_EMERG "CPUMF sampling was not set inactive.\n");
171
172 return rc;
173}
174
175static int smp_ctl_ssctl_enable_activate(int cpu, unsigned long interval)
176{
177 int rc;
178 struct hws_execute_parms ep;
179 struct hws_cpu_buffer *cb;
180
181 cb = &per_cpu(sampler_cpu_buffer, cpu);
182
183 cb->ssctl.h = 1;
184 cb->ssctl.tear = cb->first_sdbt;
185 cb->ssctl.dear = *(unsigned long *) cb->first_sdbt;
186 cb->ssctl.interval = interval;
187 cb->ssctl.es = 1;
188 cb->ssctl.cs = 1;
189
190 ep.buffer = &cb->ssctl;
191 smp_call_function_single(cpu, execute_ssctl, &ep, 1);
192 rc = ep.rc;
193 if (rc)
194 printk(KERN_ERR "hwsampler: CPU %d CPUMF SSCTL failed.\n", cpu);
195
196 ep.buffer = &cb->qsi;
197 smp_call_function_single(cpu, execute_qsi, &ep, 1);
198 if (ep.rc)
199 printk(KERN_ERR "hwsampler: CPU %d CPUMF QSI failed.\n", cpu);
200
201 return rc;
202}
203
204static int smp_ctl_qsi(int cpu)
205{
206 struct hws_execute_parms ep;
207 struct hws_cpu_buffer *cb;
208
209 cb = &per_cpu(sampler_cpu_buffer, cpu);
210
211 ep.buffer = &cb->qsi;
212 smp_call_function_single(cpu, execute_qsi, &ep, 1);
213
214 return ep.rc;
215}
216
217static inline unsigned long *trailer_entry_ptr(unsigned long v)
218{
219 void *ret;
220
221 ret = (void *)v;
222 ret += PAGE_SIZE;
223 ret -= sizeof(struct hws_trailer_entry);
224
225 return (unsigned long *) ret;
226}
227
Heiko Carstensfde15c32012-03-11 11:59:31 -0400228static void hws_ext_handler(struct ext_code ext_code,
Jan Glauberb03d541a2012-03-23 11:13:05 +0100229 unsigned int param32, unsigned long param64)
230{
231 struct hws_cpu_buffer *cb = &__get_cpu_var(sampler_cpu_buffer);
232
233 if (!(param32 & CPU_MF_INT_SF_MASK))
234 return;
235
Hendrik Brueckner02456162012-05-09 16:27:40 +0200236 kstat_cpu(smp_processor_id()).irqs[EXTINT_CMS]++;
Jan Glauberb03d541a2012-03-23 11:13:05 +0100237 atomic_xchg(&cb->ext_params, atomic_read(&cb->ext_params) | param32);
238
239 if (hws_wq)
240 queue_work(hws_wq, &cb->worker);
241}
Heinz Graalfsec6a3df2011-01-21 10:06:52 +0000242
243static void worker(struct work_struct *work);
244
245static void add_samples_to_oprofile(unsigned cpu, unsigned long *,
246 unsigned long *dear);
247
248static void init_all_cpu_buffers(void)
249{
250 int cpu;
251 struct hws_cpu_buffer *cb;
252
253 for_each_online_cpu(cpu) {
254 cb = &per_cpu(sampler_cpu_buffer, cpu);
255 memset(cb, 0, sizeof(struct hws_cpu_buffer));
256 }
257}
258
259static int is_link_entry(unsigned long *s)
260{
261 return *s & 0x1ul ? 1 : 0;
262}
263
264static unsigned long *get_next_sdbt(unsigned long *s)
265{
266 return (unsigned long *) (*s & ~0x1ul);
267}
268
269static int prepare_cpu_buffers(void)
270{
271 int cpu;
272 int rc;
273 struct hws_cpu_buffer *cb;
274
275 rc = 0;
276 for_each_online_cpu(cpu) {
277 cb = &per_cpu(sampler_cpu_buffer, cpu);
278 atomic_set(&cb->ext_params, 0);
279 cb->worker_entry = 0;
280 cb->sample_overflow = 0;
281 cb->req_alert = 0;
282 cb->incorrect_sdbt_entry = 0;
283 cb->invalid_entry_address = 0;
284 cb->loss_of_sample_data = 0;
285 cb->sample_auth_change_alert = 0;
286 cb->finish = 0;
287 cb->oom = 0;
288 cb->stop_mode = 0;
289 }
290
291 return rc;
292}
293
294/*
295 * allocate_sdbt() - allocate sampler memory
296 * @cpu: the cpu for which sampler memory is allocated
297 *
298 * A 4K page is allocated for each requested SDBT.
299 * A maximum of 511 4K pages are allocated for the SDBs in each of the SDBTs.
300 * Set ALERT_REQ mask in each SDBs trailer.
301 * Returns zero if successful, <0 otherwise.
302 */
303static int allocate_sdbt(int cpu)
304{
305 int j, k, rc;
306 unsigned long *sdbt;
307 unsigned long sdb;
308 unsigned long *tail;
309 unsigned long *trailer;
310 struct hws_cpu_buffer *cb;
311
312 cb = &per_cpu(sampler_cpu_buffer, cpu);
313
314 if (cb->first_sdbt)
315 return -EINVAL;
316
317 sdbt = NULL;
318 tail = sdbt;
319
320 for (j = 0; j < num_sdbt; j++) {
321 sdbt = (unsigned long *)get_zeroed_page(GFP_KERNEL);
322
323 mutex_lock(&hws_sem_oom);
324 /* OOM killer might have been activated */
325 barrier();
326 if (oom_killer_was_active || !sdbt) {
327 if (sdbt)
328 free_page((unsigned long)sdbt);
329
330 goto allocate_sdbt_error;
331 }
332 if (cb->first_sdbt == 0)
333 cb->first_sdbt = (unsigned long)sdbt;
334
335 /* link current page to tail of chain */
336 if (tail)
337 *tail = (unsigned long)(void *)sdbt + 1;
338
339 mutex_unlock(&hws_sem_oom);
340
341 for (k = 0; k < num_sdb; k++) {
342 /* get and set SDB page */
343 sdb = get_zeroed_page(GFP_KERNEL);
344
345 mutex_lock(&hws_sem_oom);
346 /* OOM killer might have been activated */
347 barrier();
348 if (oom_killer_was_active || !sdb) {
349 if (sdb)
350 free_page(sdb);
351
352 goto allocate_sdbt_error;
353 }
354 *sdbt = sdb;
355 trailer = trailer_entry_ptr(*sdbt);
356 *trailer = ALERT_REQ_MASK;
357 sdbt++;
358 mutex_unlock(&hws_sem_oom);
359 }
360 tail = sdbt;
361 }
362 mutex_lock(&hws_sem_oom);
363 if (oom_killer_was_active)
364 goto allocate_sdbt_error;
365
366 rc = 0;
367 if (tail)
368 *tail = (unsigned long)
369 ((void *)cb->first_sdbt) + 1;
370
371allocate_sdbt_exit:
372 mutex_unlock(&hws_sem_oom);
373 return rc;
374
375allocate_sdbt_error:
376 rc = -ENOMEM;
377 goto allocate_sdbt_exit;
378}
379
380/*
381 * deallocate_sdbt() - deallocate all sampler memory
382 *
383 * For each online CPU all SDBT trees are deallocated.
384 * Returns the number of freed pages.
385 */
386static int deallocate_sdbt(void)
387{
388 int cpu;
389 int counter;
390
391 counter = 0;
392
393 for_each_online_cpu(cpu) {
394 unsigned long start;
395 unsigned long sdbt;
396 unsigned long *curr;
397 struct hws_cpu_buffer *cb;
398
399 cb = &per_cpu(sampler_cpu_buffer, cpu);
400
401 if (!cb->first_sdbt)
402 continue;
403
404 sdbt = cb->first_sdbt;
405 curr = (unsigned long *) sdbt;
406 start = sdbt;
407
408 /* we'll free the SDBT after all SDBs are processed... */
409 while (1) {
410 if (!*curr || !sdbt)
411 break;
412
413 /* watch for link entry reset if found */
414 if (is_link_entry(curr)) {
415 curr = get_next_sdbt(curr);
416 if (sdbt)
417 free_page(sdbt);
418
419 /* we are done if we reach the start */
420 if ((unsigned long) curr == start)
421 break;
422 else
423 sdbt = (unsigned long) curr;
424 } else {
425 /* process SDB pointer */
426 if (*curr) {
427 free_page(*curr);
428 curr++;
429 }
430 }
431 counter++;
432 }
433 cb->first_sdbt = 0;
434 }
435 return counter;
436}
437
438static int start_sampling(int cpu)
439{
440 int rc;
441 struct hws_cpu_buffer *cb;
442
443 cb = &per_cpu(sampler_cpu_buffer, cpu);
444 rc = smp_ctl_ssctl_enable_activate(cpu, interval);
445 if (rc) {
446 printk(KERN_INFO "hwsampler: CPU %d ssctl failed.\n", cpu);
447 goto start_exit;
448 }
449
450 rc = -EINVAL;
451 if (!cb->qsi.es) {
452 printk(KERN_INFO "hwsampler: CPU %d ssctl not enabled.\n", cpu);
453 goto start_exit;
454 }
455
456 if (!cb->qsi.cs) {
457 printk(KERN_INFO "hwsampler: CPU %d ssctl not active.\n", cpu);
458 goto start_exit;
459 }
460
461 printk(KERN_INFO
462 "hwsampler: CPU %d, CPUMF Sampling started, interval %lu.\n",
463 cpu, interval);
464
465 rc = 0;
466
467start_exit:
468 return rc;
469}
470
471static int stop_sampling(int cpu)
472{
473 unsigned long v;
474 int rc;
475 struct hws_cpu_buffer *cb;
476
477 rc = smp_ctl_qsi(cpu);
478 WARN_ON(rc);
479
480 cb = &per_cpu(sampler_cpu_buffer, cpu);
481 if (!rc && !cb->qsi.es)
482 printk(KERN_INFO "hwsampler: CPU %d, already stopped.\n", cpu);
483
484 rc = smp_ctl_ssctl_stop(cpu);
485 if (rc) {
486 printk(KERN_INFO "hwsampler: CPU %d, ssctl stop error %d.\n",
487 cpu, rc);
488 goto stop_exit;
489 }
490
491 printk(KERN_INFO "hwsampler: CPU %d, CPUMF Sampling stopped.\n", cpu);
492
493stop_exit:
494 v = cb->req_alert;
495 if (v)
496 printk(KERN_ERR "hwsampler: CPU %d CPUMF Request alert,"
497 " count=%lu.\n", cpu, v);
498
499 v = cb->loss_of_sample_data;
500 if (v)
501 printk(KERN_ERR "hwsampler: CPU %d CPUMF Loss of sample data,"
502 " count=%lu.\n", cpu, v);
503
504 v = cb->invalid_entry_address;
505 if (v)
506 printk(KERN_ERR "hwsampler: CPU %d CPUMF Invalid entry address,"
507 " count=%lu.\n", cpu, v);
508
509 v = cb->incorrect_sdbt_entry;
510 if (v)
511 printk(KERN_ERR
512 "hwsampler: CPU %d CPUMF Incorrect SDBT address,"
513 " count=%lu.\n", cpu, v);
514
515 v = cb->sample_auth_change_alert;
516 if (v)
517 printk(KERN_ERR
518 "hwsampler: CPU %d CPUMF Sample authorization change,"
519 " count=%lu.\n", cpu, v);
520
521 return rc;
522}
523
524static int check_hardware_prerequisites(void)
525{
Jan Glauber65a94b12011-04-04 09:43:29 +0200526 if (!test_facility(68))
Heinz Graalfsec6a3df2011-01-21 10:06:52 +0000527 return -EOPNOTSUPP;
Heinz Graalfsec6a3df2011-01-21 10:06:52 +0000528 return 0;
529}
530/*
531 * hws_oom_callback() - the OOM callback function
532 *
533 * In case the callback is invoked during memory allocation for the
534 * hw sampler, all obtained memory is deallocated and a flag is set
535 * so main sampler memory allocation can exit with a failure code.
536 * In case the callback is invoked during sampling the hw sampler
537 * is deactivated for all CPUs.
538 */
539static int hws_oom_callback(struct notifier_block *nfb,
540 unsigned long dummy, void *parm)
541{
542 unsigned long *freed;
543 int cpu;
544 struct hws_cpu_buffer *cb;
545
546 freed = parm;
547
548 mutex_lock(&hws_sem_oom);
549
550 if (hws_state == HWS_DEALLOCATED) {
551 /* during memory allocation */
552 if (oom_killer_was_active == 0) {
553 oom_killer_was_active = 1;
554 *freed += deallocate_sdbt();
555 }
556 } else {
557 int i;
558 cpu = get_cpu();
559 cb = &per_cpu(sampler_cpu_buffer, cpu);
560
561 if (!cb->oom) {
562 for_each_online_cpu(i) {
563 smp_ctl_ssctl_deactivate(i);
564 cb->oom = 1;
565 }
566 cb->finish = 1;
567
568 printk(KERN_INFO
569 "hwsampler: CPU %d, OOM notify during CPUMF Sampling.\n",
570 cpu);
571 }
572 }
573
574 mutex_unlock(&hws_sem_oom);
575
576 return NOTIFY_OK;
577}
578
579static struct notifier_block hws_oom_notifier = {
580 .notifier_call = hws_oom_callback
581};
582
Robert Richter7bb2e262011-02-14 19:08:33 +0100583static int hws_cpu_callback(struct notifier_block *nfb,
Heinz Graalfsec6a3df2011-01-21 10:06:52 +0000584 unsigned long action, void *hcpu)
585{
586 /* We do not have sampler space available for all possible CPUs.
587 All CPUs should be online when hw sampling is activated. */
Martin Schwidefskyb07c9012011-05-26 09:48:26 +0200588 return (hws_state <= HWS_DEALLOCATED) ? NOTIFY_OK : NOTIFY_BAD;
Heinz Graalfsec6a3df2011-01-21 10:06:52 +0000589}
590
591static struct notifier_block hws_cpu_notifier = {
592 .notifier_call = hws_cpu_callback
593};
594
595/**
596 * hwsampler_deactivate() - set hardware sampling temporarily inactive
597 * @cpu: specifies the CPU to be set inactive.
598 *
599 * Returns 0 on success, !0 on failure.
600 */
601int hwsampler_deactivate(unsigned int cpu)
602{
603 /*
604 * Deactivate hw sampling temporarily and flush the buffer
605 * by pushing all the pending samples to oprofile buffer.
606 *
607 * This function can be called under one of the following conditions:
608 * Memory unmap, task is exiting.
609 */
610 int rc;
611 struct hws_cpu_buffer *cb;
612
613 rc = 0;
614 mutex_lock(&hws_sem);
615
616 cb = &per_cpu(sampler_cpu_buffer, cpu);
617 if (hws_state == HWS_STARTED) {
618 rc = smp_ctl_qsi(cpu);
619 WARN_ON(rc);
620 if (cb->qsi.cs) {
621 rc = smp_ctl_ssctl_deactivate(cpu);
622 if (rc) {
623 printk(KERN_INFO
624 "hwsampler: CPU %d, CPUMF Deactivation failed.\n", cpu);
625 cb->finish = 1;
626 hws_state = HWS_STOPPING;
627 } else {
628 hws_flush_all = 1;
629 /* Add work to queue to read pending samples.*/
630 queue_work_on(cpu, hws_wq, &cb->worker);
631 }
632 }
633 }
634 mutex_unlock(&hws_sem);
635
636 if (hws_wq)
637 flush_workqueue(hws_wq);
638
639 return rc;
640}
641
642/**
643 * hwsampler_activate() - activate/resume hardware sampling which was deactivated
644 * @cpu: specifies the CPU to be set active.
645 *
646 * Returns 0 on success, !0 on failure.
647 */
648int hwsampler_activate(unsigned int cpu)
649{
650 /*
651 * Re-activate hw sampling. This should be called in pair with
652 * hwsampler_deactivate().
653 */
654 int rc;
655 struct hws_cpu_buffer *cb;
656
657 rc = 0;
658 mutex_lock(&hws_sem);
659
660 cb = &per_cpu(sampler_cpu_buffer, cpu);
661 if (hws_state == HWS_STARTED) {
662 rc = smp_ctl_qsi(cpu);
663 WARN_ON(rc);
664 if (!cb->qsi.cs) {
665 hws_flush_all = 0;
666 rc = smp_ctl_ssctl_enable_activate(cpu, interval);
667 if (rc) {
668 printk(KERN_ERR
669 "CPU %d, CPUMF activate sampling failed.\n",
670 cpu);
671 }
672 }
673 }
674
675 mutex_unlock(&hws_sem);
676
677 return rc;
678}
679
Heinz Graalfsec6a3df2011-01-21 10:06:52 +0000680static int check_qsi_on_setup(void)
681{
682 int rc;
683 unsigned int cpu;
684 struct hws_cpu_buffer *cb;
685
686 for_each_online_cpu(cpu) {
687 cb = &per_cpu(sampler_cpu_buffer, cpu);
688 rc = smp_ctl_qsi(cpu);
689 WARN_ON(rc);
690 if (rc)
691 return -EOPNOTSUPP;
692
693 if (!cb->qsi.as) {
694 printk(KERN_INFO "hwsampler: CPUMF sampling is not authorized.\n");
695 return -EINVAL;
696 }
697
698 if (cb->qsi.es) {
699 printk(KERN_WARNING "hwsampler: CPUMF is still enabled.\n");
700 rc = smp_ctl_ssctl_stop(cpu);
701 if (rc)
702 return -EINVAL;
703
704 printk(KERN_INFO
705 "CPU %d, CPUMF Sampling stopped now.\n", cpu);
706 }
707 }
708 return 0;
709}
710
711static int check_qsi_on_start(void)
712{
713 unsigned int cpu;
714 int rc;
715 struct hws_cpu_buffer *cb;
716
717 for_each_online_cpu(cpu) {
718 cb = &per_cpu(sampler_cpu_buffer, cpu);
719 rc = smp_ctl_qsi(cpu);
720 WARN_ON(rc);
721
722 if (!cb->qsi.as)
723 return -EINVAL;
724
725 if (cb->qsi.es)
726 return -EINVAL;
727
728 if (cb->qsi.cs)
729 return -EINVAL;
730 }
731 return 0;
732}
733
734static void worker_on_start(unsigned int cpu)
735{
736 struct hws_cpu_buffer *cb;
737
738 cb = &per_cpu(sampler_cpu_buffer, cpu);
739 cb->worker_entry = cb->first_sdbt;
740}
741
742static int worker_check_error(unsigned int cpu, int ext_params)
743{
744 int rc;
745 unsigned long *sdbt;
746 struct hws_cpu_buffer *cb;
747
748 rc = 0;
749 cb = &per_cpu(sampler_cpu_buffer, cpu);
750 sdbt = (unsigned long *) cb->worker_entry;
751
752 if (!sdbt || !*sdbt)
753 return -EINVAL;
754
Jan Glauberb03d541a2012-03-23 11:13:05 +0100755 if (ext_params & CPU_MF_INT_SF_PRA)
Heinz Graalfsec6a3df2011-01-21 10:06:52 +0000756 cb->req_alert++;
757
Jan Glauberb03d541a2012-03-23 11:13:05 +0100758 if (ext_params & CPU_MF_INT_SF_LSDA)
Heinz Graalfsec6a3df2011-01-21 10:06:52 +0000759 cb->loss_of_sample_data++;
760
Jan Glauberb03d541a2012-03-23 11:13:05 +0100761 if (ext_params & CPU_MF_INT_SF_IAE) {
Heinz Graalfsec6a3df2011-01-21 10:06:52 +0000762 cb->invalid_entry_address++;
763 rc = -EINVAL;
764 }
765
Jan Glauberb03d541a2012-03-23 11:13:05 +0100766 if (ext_params & CPU_MF_INT_SF_ISE) {
Heinz Graalfsec6a3df2011-01-21 10:06:52 +0000767 cb->incorrect_sdbt_entry++;
768 rc = -EINVAL;
769 }
770
Jan Glauberb03d541a2012-03-23 11:13:05 +0100771 if (ext_params & CPU_MF_INT_SF_SACA) {
Heinz Graalfsec6a3df2011-01-21 10:06:52 +0000772 cb->sample_auth_change_alert++;
773 rc = -EINVAL;
774 }
775
776 return rc;
777}
778
779static void worker_on_finish(unsigned int cpu)
780{
781 int rc, i;
782 struct hws_cpu_buffer *cb;
783
784 cb = &per_cpu(sampler_cpu_buffer, cpu);
785
786 if (cb->finish) {
787 rc = smp_ctl_qsi(cpu);
788 WARN_ON(rc);
789 if (cb->qsi.es) {
790 printk(KERN_INFO
791 "hwsampler: CPU %d, CPUMF Stop/Deactivate sampling.\n",
792 cpu);
793 rc = smp_ctl_ssctl_stop(cpu);
794 if (rc)
795 printk(KERN_INFO
796 "hwsampler: CPU %d, CPUMF Deactivation failed.\n",
797 cpu);
798
799 for_each_online_cpu(i) {
800 if (i == cpu)
801 continue;
802 if (!cb->finish) {
803 cb->finish = 1;
804 queue_work_on(i, hws_wq,
805 &cb->worker);
806 }
807 }
808 }
809 }
810}
811
812static void worker_on_interrupt(unsigned int cpu)
813{
814 unsigned long *sdbt;
815 unsigned char done;
816 struct hws_cpu_buffer *cb;
817
818 cb = &per_cpu(sampler_cpu_buffer, cpu);
819
820 sdbt = (unsigned long *) cb->worker_entry;
821
822 done = 0;
823 /* do not proceed if stop was entered,
824 * forget the buffers not yet processed */
825 while (!done && !cb->stop_mode) {
826 unsigned long *trailer;
827 struct hws_trailer_entry *te;
828 unsigned long *dear = 0;
829
830 trailer = trailer_entry_ptr(*sdbt);
831 /* leave loop if no more work to do */
832 if (!(*trailer & BUFFER_FULL_MASK)) {
833 done = 1;
834 if (!hws_flush_all)
835 continue;
836 }
837
838 te = (struct hws_trailer_entry *)trailer;
839 cb->sample_overflow += te->overflow;
840
841 add_samples_to_oprofile(cpu, sdbt, dear);
842
843 /* reset trailer */
844 xchg((unsigned char *) te, 0x40);
845
846 /* advance to next sdb slot in current sdbt */
847 sdbt++;
848 /* in case link bit is set use address w/o link bit */
849 if (is_link_entry(sdbt))
850 sdbt = get_next_sdbt(sdbt);
851
852 cb->worker_entry = (unsigned long)sdbt;
853 }
854}
855
856static void add_samples_to_oprofile(unsigned int cpu, unsigned long *sdbt,
857 unsigned long *dear)
858{
859 struct hws_data_entry *sample_data_ptr;
860 unsigned long *trailer;
861
862 trailer = trailer_entry_ptr(*sdbt);
863 if (dear) {
864 if (dear > trailer)
865 return;
866 trailer = dear;
867 }
868
869 sample_data_ptr = (struct hws_data_entry *)(*sdbt);
870
871 while ((unsigned long *)sample_data_ptr < trailer) {
872 struct pt_regs *regs = NULL;
873 struct task_struct *tsk = NULL;
874
875 /*
876 * Check sampling mode, 1 indicates basic (=customer) sampling
877 * mode.
878 */
879 if (sample_data_ptr->def != 1) {
880 /* sample slot is not yet written */
881 break;
882 } else {
883 /* make sure we don't use it twice,
884 * the next time the sampler will set it again */
885 sample_data_ptr->def = 0;
886 }
887
888 /* Get pt_regs. */
889 if (sample_data_ptr->P == 1) {
890 /* userspace sample */
891 unsigned int pid = sample_data_ptr->prim_asn;
Andreas Krebbeldd3c4672011-11-25 20:03:05 +0100892 if (!counter_config.user)
893 goto skip_sample;
Heinz Graalfsec6a3df2011-01-21 10:06:52 +0000894 rcu_read_lock();
895 tsk = pid_task(find_vpid(pid), PIDTYPE_PID);
896 if (tsk)
897 regs = task_pt_regs(tsk);
898 rcu_read_unlock();
899 } else {
900 /* kernelspace sample */
Andreas Krebbeldd3c4672011-11-25 20:03:05 +0100901 if (!counter_config.kernel)
902 goto skip_sample;
Heinz Graalfsec6a3df2011-01-21 10:06:52 +0000903 regs = task_pt_regs(current);
904 }
905
906 mutex_lock(&hws_sem);
907 oprofile_add_ext_hw_sample(sample_data_ptr->ia, regs, 0,
908 !sample_data_ptr->P, tsk);
909 mutex_unlock(&hws_sem);
Andreas Krebbeldd3c4672011-11-25 20:03:05 +0100910 skip_sample:
Heinz Graalfsec6a3df2011-01-21 10:06:52 +0000911 sample_data_ptr++;
912 }
913}
914
915static void worker(struct work_struct *work)
916{
917 unsigned int cpu;
918 int ext_params;
919 struct hws_cpu_buffer *cb;
920
921 cb = container_of(work, struct hws_cpu_buffer, worker);
922 cpu = smp_processor_id();
923 ext_params = atomic_xchg(&cb->ext_params, 0);
924
925 if (!cb->worker_entry)
926 worker_on_start(cpu);
927
928 if (worker_check_error(cpu, ext_params))
929 return;
930
931 if (!cb->finish)
932 worker_on_interrupt(cpu);
933
934 if (cb->finish)
935 worker_on_finish(cpu);
936}
937
938/**
939 * hwsampler_allocate() - allocate memory for the hardware sampler
940 * @sdbt: number of SDBTs per online CPU (must be > 0)
941 * @sdb: number of SDBs per SDBT (minimum 1, maximum 511)
942 *
943 * Returns 0 on success, !0 on failure.
944 */
945int hwsampler_allocate(unsigned long sdbt, unsigned long sdb)
946{
947 int cpu, rc;
948 mutex_lock(&hws_sem);
949
950 rc = -EINVAL;
951 if (hws_state != HWS_DEALLOCATED)
952 goto allocate_exit;
953
954 if (sdbt < 1)
955 goto allocate_exit;
956
957 if (sdb > MAX_NUM_SDB || sdb < MIN_NUM_SDB)
958 goto allocate_exit;
959
960 num_sdbt = sdbt;
961 num_sdb = sdb;
962
963 oom_killer_was_active = 0;
964 register_oom_notifier(&hws_oom_notifier);
965
966 for_each_online_cpu(cpu) {
967 if (allocate_sdbt(cpu)) {
968 unregister_oom_notifier(&hws_oom_notifier);
969 goto allocate_error;
970 }
971 }
972 unregister_oom_notifier(&hws_oom_notifier);
973 if (oom_killer_was_active)
974 goto allocate_error;
975
976 hws_state = HWS_STOPPED;
977 rc = 0;
978
979allocate_exit:
980 mutex_unlock(&hws_sem);
981 return rc;
982
983allocate_error:
984 rc = -ENOMEM;
985 printk(KERN_ERR "hwsampler: CPUMF Memory allocation failed.\n");
986 goto allocate_exit;
987}
988
989/**
990 * hwsampler_deallocate() - deallocate hardware sampler memory
991 *
992 * Returns 0 on success, !0 on failure.
993 */
Martin Schwidefskye54aafa2011-10-30 15:17:12 +0100994int hwsampler_deallocate(void)
Heinz Graalfsec6a3df2011-01-21 10:06:52 +0000995{
996 int rc;
997
998 mutex_lock(&hws_sem);
999
1000 rc = -EINVAL;
1001 if (hws_state != HWS_STOPPED)
1002 goto deallocate_exit;
1003
Jan Glauberb03d541a2012-03-23 11:13:05 +01001004 measurement_alert_subclass_unregister();
Heinz Graalfsec6a3df2011-01-21 10:06:52 +00001005 deallocate_sdbt();
1006
1007 hws_state = HWS_DEALLOCATED;
1008 rc = 0;
1009
1010deallocate_exit:
1011 mutex_unlock(&hws_sem);
1012
1013 return rc;
1014}
1015
Martin Schwidefsky3d8dcb32011-05-10 17:13:42 +02001016unsigned long hwsampler_query_min_interval(void)
Heinz Graalfsec6a3df2011-01-21 10:06:52 +00001017{
Martin Schwidefsky3d8dcb32011-05-10 17:13:42 +02001018 return min_sampler_rate;
Heinz Graalfsec6a3df2011-01-21 10:06:52 +00001019}
1020
Martin Schwidefsky3d8dcb32011-05-10 17:13:42 +02001021unsigned long hwsampler_query_max_interval(void)
Heinz Graalfsec6a3df2011-01-21 10:06:52 +00001022{
Martin Schwidefsky3d8dcb32011-05-10 17:13:42 +02001023 return max_sampler_rate;
Heinz Graalfsec6a3df2011-01-21 10:06:52 +00001024}
1025
1026unsigned long hwsampler_get_sample_overflow_count(unsigned int cpu)
1027{
1028 struct hws_cpu_buffer *cb;
1029
1030 cb = &per_cpu(sampler_cpu_buffer, cpu);
1031
1032 return cb->sample_overflow;
1033}
1034
Martin Schwidefskye54aafa2011-10-30 15:17:12 +01001035int hwsampler_setup(void)
Heinz Graalfsec6a3df2011-01-21 10:06:52 +00001036{
1037 int rc;
1038 int cpu;
1039 struct hws_cpu_buffer *cb;
1040
1041 mutex_lock(&hws_sem);
1042
1043 rc = -EINVAL;
1044 if (hws_state)
1045 goto setup_exit;
1046
1047 hws_state = HWS_INIT;
1048
1049 init_all_cpu_buffers();
1050
1051 rc = check_hardware_prerequisites();
1052 if (rc)
1053 goto setup_exit;
1054
1055 rc = check_qsi_on_setup();
1056 if (rc)
1057 goto setup_exit;
1058
1059 rc = -EINVAL;
1060 hws_wq = create_workqueue("hwsampler");
1061 if (!hws_wq)
1062 goto setup_exit;
1063
1064 register_cpu_notifier(&hws_cpu_notifier);
1065
1066 for_each_online_cpu(cpu) {
1067 cb = &per_cpu(sampler_cpu_buffer, cpu);
1068 INIT_WORK(&cb->worker, worker);
1069 rc = smp_ctl_qsi(cpu);
1070 WARN_ON(rc);
1071 if (min_sampler_rate != cb->qsi.min_sampl_rate) {
1072 if (min_sampler_rate) {
1073 printk(KERN_WARNING
1074 "hwsampler: different min sampler rate values.\n");
1075 if (min_sampler_rate < cb->qsi.min_sampl_rate)
1076 min_sampler_rate =
1077 cb->qsi.min_sampl_rate;
1078 } else
1079 min_sampler_rate = cb->qsi.min_sampl_rate;
1080 }
1081 if (max_sampler_rate != cb->qsi.max_sampl_rate) {
1082 if (max_sampler_rate) {
1083 printk(KERN_WARNING
1084 "hwsampler: different max sampler rate values.\n");
1085 if (max_sampler_rate > cb->qsi.max_sampl_rate)
1086 max_sampler_rate =
1087 cb->qsi.max_sampl_rate;
1088 } else
1089 max_sampler_rate = cb->qsi.max_sampl_rate;
1090 }
1091 }
1092 register_external_interrupt(0x1407, hws_ext_handler);
1093
1094 hws_state = HWS_DEALLOCATED;
1095 rc = 0;
1096
1097setup_exit:
1098 mutex_unlock(&hws_sem);
1099 return rc;
1100}
1101
Martin Schwidefskye54aafa2011-10-30 15:17:12 +01001102int hwsampler_shutdown(void)
Heinz Graalfsec6a3df2011-01-21 10:06:52 +00001103{
1104 int rc;
1105
1106 mutex_lock(&hws_sem);
1107
1108 rc = -EINVAL;
1109 if (hws_state == HWS_DEALLOCATED || hws_state == HWS_STOPPED) {
1110 mutex_unlock(&hws_sem);
1111
1112 if (hws_wq)
1113 flush_workqueue(hws_wq);
1114
1115 mutex_lock(&hws_sem);
1116
1117 if (hws_state == HWS_STOPPED) {
Jan Glauberb03d541a2012-03-23 11:13:05 +01001118 measurement_alert_subclass_unregister();
Heinz Graalfsec6a3df2011-01-21 10:06:52 +00001119 deallocate_sdbt();
1120 }
1121 if (hws_wq) {
1122 destroy_workqueue(hws_wq);
1123 hws_wq = NULL;
1124 }
1125
1126 unregister_external_interrupt(0x1407, hws_ext_handler);
1127 hws_state = HWS_INIT;
1128 rc = 0;
1129 }
1130 mutex_unlock(&hws_sem);
1131
1132 unregister_cpu_notifier(&hws_cpu_notifier);
1133
1134 return rc;
1135}
1136
1137/**
1138 * hwsampler_start_all() - start hardware sampling on all online CPUs
1139 * @rate: specifies the used interval when samples are taken
1140 *
1141 * Returns 0 on success, !0 on failure.
1142 */
1143int hwsampler_start_all(unsigned long rate)
1144{
1145 int rc, cpu;
1146
1147 mutex_lock(&hws_sem);
1148
1149 hws_oom = 0;
1150
1151 rc = -EINVAL;
1152 if (hws_state != HWS_STOPPED)
1153 goto start_all_exit;
1154
1155 interval = rate;
1156
1157 /* fail if rate is not valid */
1158 if (interval < min_sampler_rate || interval > max_sampler_rate)
1159 goto start_all_exit;
1160
1161 rc = check_qsi_on_start();
1162 if (rc)
1163 goto start_all_exit;
1164
1165 rc = prepare_cpu_buffers();
1166 if (rc)
1167 goto start_all_exit;
1168
1169 for_each_online_cpu(cpu) {
1170 rc = start_sampling(cpu);
1171 if (rc)
1172 break;
1173 }
1174 if (rc) {
1175 for_each_online_cpu(cpu) {
1176 stop_sampling(cpu);
1177 }
1178 goto start_all_exit;
1179 }
1180 hws_state = HWS_STARTED;
1181 rc = 0;
1182
1183start_all_exit:
1184 mutex_unlock(&hws_sem);
1185
1186 if (rc)
1187 return rc;
1188
1189 register_oom_notifier(&hws_oom_notifier);
1190 hws_oom = 1;
1191 hws_flush_all = 0;
1192 /* now let them in, 1407 CPUMF external interrupts */
Jan Glauberb03d541a2012-03-23 11:13:05 +01001193 measurement_alert_subclass_register();
Heinz Graalfsec6a3df2011-01-21 10:06:52 +00001194
1195 return 0;
1196}
1197
1198/**
1199 * hwsampler_stop_all() - stop hardware sampling on all online CPUs
1200 *
1201 * Returns 0 on success, !0 on failure.
1202 */
Martin Schwidefskye54aafa2011-10-30 15:17:12 +01001203int hwsampler_stop_all(void)
Heinz Graalfsec6a3df2011-01-21 10:06:52 +00001204{
1205 int tmp_rc, rc, cpu;
1206 struct hws_cpu_buffer *cb;
1207
1208 mutex_lock(&hws_sem);
1209
1210 rc = 0;
1211 if (hws_state == HWS_INIT) {
1212 mutex_unlock(&hws_sem);
1213 return rc;
1214 }
1215 hws_state = HWS_STOPPING;
1216 mutex_unlock(&hws_sem);
1217
1218 for_each_online_cpu(cpu) {
1219 cb = &per_cpu(sampler_cpu_buffer, cpu);
1220 cb->stop_mode = 1;
1221 tmp_rc = stop_sampling(cpu);
1222 if (tmp_rc)
1223 rc = tmp_rc;
1224 }
1225
1226 if (hws_wq)
1227 flush_workqueue(hws_wq);
1228
1229 mutex_lock(&hws_sem);
1230 if (hws_oom) {
1231 unregister_oom_notifier(&hws_oom_notifier);
1232 hws_oom = 0;
1233 }
1234 hws_state = HWS_STOPPED;
1235 mutex_unlock(&hws_sem);
1236
1237 return rc;
1238}