]> git.kernelconcepts.de Git - karo-tx-linux.git/blob - arch/s390/oprofile/hwsampler.c
block: Fix front merge check
[karo-tx-linux.git] / arch / s390 / oprofile / hwsampler.c
1 /*
2  * Copyright IBM Corp. 2010
3  * Author: Heinz Graalfs <graalfs@de.ibm.com>
4  */
5
6 #include <linux/kernel_stat.h>
7 #include <linux/kernel.h>
8 #include <linux/module.h>
9 #include <linux/smp.h>
10 #include <linux/errno.h>
11 #include <linux/workqueue.h>
12 #include <linux/interrupt.h>
13 #include <linux/notifier.h>
14 #include <linux/cpu.h>
15 #include <linux/semaphore.h>
16 #include <linux/oom.h>
17 #include <linux/oprofile.h>
18
19 #include <asm/facility.h>
20 #include <asm/cpu_mf.h>
21 #include <asm/irq.h>
22
23 #include "hwsampler.h"
24 #include "op_counter.h"
25
26 #define MAX_NUM_SDB 511
27 #define MIN_NUM_SDB 1
28
29 DECLARE_PER_CPU(struct hws_cpu_buffer, sampler_cpu_buffer);
30
31 struct hws_execute_parms {
32         void *buffer;
33         signed int rc;
34 };
35
36 DEFINE_PER_CPU(struct hws_cpu_buffer, sampler_cpu_buffer);
37 EXPORT_PER_CPU_SYMBOL(sampler_cpu_buffer);
38
39 static DEFINE_MUTEX(hws_sem);
40 static DEFINE_MUTEX(hws_sem_oom);
41
42 static unsigned char hws_flush_all;
43 static unsigned int hws_oom;
44 static unsigned int hws_alert;
45 static struct workqueue_struct *hws_wq;
46
47 static unsigned int hws_state;
48 enum {
49         HWS_INIT = 1,
50         HWS_DEALLOCATED,
51         HWS_STOPPED,
52         HWS_STARTED,
53         HWS_STOPPING };
54
55 /* set to 1 if called by kernel during memory allocation */
56 static unsigned char oom_killer_was_active;
57 /* size of SDBT and SDB as of allocate API */
58 static unsigned long num_sdbt = 100;
59 static unsigned long num_sdb = 511;
60 /* sampling interval (machine cycles) */
61 static unsigned long interval;
62
63 static unsigned long min_sampler_rate;
64 static unsigned long max_sampler_rate;
65
66 static void execute_qsi(void *parms)
67 {
68         struct hws_execute_parms *ep = parms;
69
70         ep->rc = qsi(ep->buffer);
71 }
72
73 static void execute_ssctl(void *parms)
74 {
75         struct hws_execute_parms *ep = parms;
76
77         ep->rc = lsctl(ep->buffer);
78 }
79
80 static int smp_ctl_ssctl_stop(int cpu)
81 {
82         int rc;
83         struct hws_execute_parms ep;
84         struct hws_cpu_buffer *cb;
85
86         cb = &per_cpu(sampler_cpu_buffer, cpu);
87
88         cb->ssctl.es = 0;
89         cb->ssctl.cs = 0;
90
91         ep.buffer = &cb->ssctl;
92         smp_call_function_single(cpu, execute_ssctl, &ep, 1);
93         rc = ep.rc;
94         if (rc) {
95                 printk(KERN_ERR "hwsampler: CPU %d CPUMF SSCTL failed.\n", cpu);
96                 dump_stack();
97         }
98
99         ep.buffer = &cb->qsi;
100         smp_call_function_single(cpu, execute_qsi, &ep, 1);
101
102         if (cb->qsi.es || cb->qsi.cs) {
103                 printk(KERN_EMERG "CPUMF sampling did not stop properly.\n");
104                 dump_stack();
105         }
106
107         return rc;
108 }
109
110 static int smp_ctl_ssctl_deactivate(int cpu)
111 {
112         int rc;
113         struct hws_execute_parms ep;
114         struct hws_cpu_buffer *cb;
115
116         cb = &per_cpu(sampler_cpu_buffer, cpu);
117
118         cb->ssctl.es = 1;
119         cb->ssctl.cs = 0;
120
121         ep.buffer = &cb->ssctl;
122         smp_call_function_single(cpu, execute_ssctl, &ep, 1);
123         rc = ep.rc;
124         if (rc)
125                 printk(KERN_ERR "hwsampler: CPU %d CPUMF SSCTL failed.\n", cpu);
126
127         ep.buffer = &cb->qsi;
128         smp_call_function_single(cpu, execute_qsi, &ep, 1);
129
130         if (cb->qsi.cs)
131                 printk(KERN_EMERG "CPUMF sampling was not set inactive.\n");
132
133         return rc;
134 }
135
136 static int smp_ctl_ssctl_enable_activate(int cpu, unsigned long interval)
137 {
138         int rc;
139         struct hws_execute_parms ep;
140         struct hws_cpu_buffer *cb;
141
142         cb = &per_cpu(sampler_cpu_buffer, cpu);
143
144         cb->ssctl.h = 1;
145         cb->ssctl.tear = cb->first_sdbt;
146         cb->ssctl.dear = *(unsigned long *) cb->first_sdbt;
147         cb->ssctl.interval = interval;
148         cb->ssctl.es = 1;
149         cb->ssctl.cs = 1;
150
151         ep.buffer = &cb->ssctl;
152         smp_call_function_single(cpu, execute_ssctl, &ep, 1);
153         rc = ep.rc;
154         if (rc)
155                 printk(KERN_ERR "hwsampler: CPU %d CPUMF SSCTL failed.\n", cpu);
156
157         ep.buffer = &cb->qsi;
158         smp_call_function_single(cpu, execute_qsi, &ep, 1);
159         if (ep.rc)
160                 printk(KERN_ERR "hwsampler: CPU %d CPUMF QSI failed.\n", cpu);
161
162         return rc;
163 }
164
165 static int smp_ctl_qsi(int cpu)
166 {
167         struct hws_execute_parms ep;
168         struct hws_cpu_buffer *cb;
169
170         cb = &per_cpu(sampler_cpu_buffer, cpu);
171
172         ep.buffer = &cb->qsi;
173         smp_call_function_single(cpu, execute_qsi, &ep, 1);
174
175         return ep.rc;
176 }
177
178 static void hws_ext_handler(struct ext_code ext_code,
179                             unsigned int param32, unsigned long param64)
180 {
181         struct hws_cpu_buffer *cb = this_cpu_ptr(&sampler_cpu_buffer);
182
183         if (!(param32 & CPU_MF_INT_SF_MASK))
184                 return;
185
186         if (!hws_alert)
187                 return;
188
189         inc_irq_stat(IRQEXT_CMS);
190         atomic_xchg(&cb->ext_params, atomic_read(&cb->ext_params) | param32);
191
192         if (hws_wq)
193                 queue_work(hws_wq, &cb->worker);
194 }
195
196 static void worker(struct work_struct *work);
197
198 static void add_samples_to_oprofile(unsigned cpu, unsigned long *,
199                                 unsigned long *dear);
200
201 static void init_all_cpu_buffers(void)
202 {
203         int cpu;
204         struct hws_cpu_buffer *cb;
205
206         for_each_online_cpu(cpu) {
207                 cb = &per_cpu(sampler_cpu_buffer, cpu);
208                 memset(cb, 0, sizeof(struct hws_cpu_buffer));
209         }
210 }
211
212 static void prepare_cpu_buffers(void)
213 {
214         struct hws_cpu_buffer *cb;
215         int cpu;
216
217         for_each_online_cpu(cpu) {
218                 cb = &per_cpu(sampler_cpu_buffer, cpu);
219                 atomic_set(&cb->ext_params, 0);
220                 cb->worker_entry = 0;
221                 cb->sample_overflow = 0;
222                 cb->req_alert = 0;
223                 cb->incorrect_sdbt_entry = 0;
224                 cb->invalid_entry_address = 0;
225                 cb->loss_of_sample_data = 0;
226                 cb->sample_auth_change_alert = 0;
227                 cb->finish = 0;
228                 cb->oom = 0;
229                 cb->stop_mode = 0;
230         }
231 }
232
233 /*
234  * allocate_sdbt() - allocate sampler memory
235  * @cpu: the cpu for which sampler memory is allocated
236  *
237  * A 4K page is allocated for each requested SDBT.
238  * A maximum of 511 4K pages are allocated for the SDBs in each of the SDBTs.
239  * Set ALERT_REQ mask in each SDBs trailer.
240  * Returns zero if successful, <0 otherwise.
241  */
242 static int allocate_sdbt(int cpu)
243 {
244         int j, k, rc;
245         unsigned long *sdbt;
246         unsigned long  sdb;
247         unsigned long *tail;
248         unsigned long *trailer;
249         struct hws_cpu_buffer *cb;
250
251         cb = &per_cpu(sampler_cpu_buffer, cpu);
252
253         if (cb->first_sdbt)
254                 return -EINVAL;
255
256         sdbt = NULL;
257         tail = sdbt;
258
259         for (j = 0; j < num_sdbt; j++) {
260                 sdbt = (unsigned long *)get_zeroed_page(GFP_KERNEL);
261
262                 mutex_lock(&hws_sem_oom);
263                 /* OOM killer might have been activated */
264                 barrier();
265                 if (oom_killer_was_active || !sdbt) {
266                         if (sdbt)
267                                 free_page((unsigned long)sdbt);
268
269                         goto allocate_sdbt_error;
270                 }
271                 if (cb->first_sdbt == 0)
272                         cb->first_sdbt = (unsigned long)sdbt;
273
274                 /* link current page to tail of chain */
275                 if (tail)
276                         *tail = (unsigned long)(void *)sdbt + 1;
277
278                 mutex_unlock(&hws_sem_oom);
279
280                 for (k = 0; k < num_sdb; k++) {
281                         /* get and set SDB page */
282                         sdb = get_zeroed_page(GFP_KERNEL);
283
284                         mutex_lock(&hws_sem_oom);
285                         /* OOM killer might have been activated */
286                         barrier();
287                         if (oom_killer_was_active || !sdb) {
288                                 if (sdb)
289                                         free_page(sdb);
290
291                                 goto allocate_sdbt_error;
292                         }
293                         *sdbt = sdb;
294                         trailer = trailer_entry_ptr(*sdbt);
295                         *trailer = SDB_TE_ALERT_REQ_MASK;
296                         sdbt++;
297                         mutex_unlock(&hws_sem_oom);
298                 }
299                 tail = sdbt;
300         }
301         mutex_lock(&hws_sem_oom);
302         if (oom_killer_was_active)
303                 goto allocate_sdbt_error;
304
305         rc = 0;
306         if (tail)
307                 *tail = (unsigned long)
308                         ((void *)cb->first_sdbt) + 1;
309
310 allocate_sdbt_exit:
311         mutex_unlock(&hws_sem_oom);
312         return rc;
313
314 allocate_sdbt_error:
315         rc = -ENOMEM;
316         goto allocate_sdbt_exit;
317 }
318
319 /*
320  * deallocate_sdbt() - deallocate all sampler memory
321  *
322  * For each online CPU all SDBT trees are deallocated.
323  * Returns the number of freed pages.
324  */
325 static int deallocate_sdbt(void)
326 {
327         int cpu;
328         int counter;
329
330         counter = 0;
331
332         for_each_online_cpu(cpu) {
333                 unsigned long start;
334                 unsigned long sdbt;
335                 unsigned long *curr;
336                 struct hws_cpu_buffer *cb;
337
338                 cb = &per_cpu(sampler_cpu_buffer, cpu);
339
340                 if (!cb->first_sdbt)
341                         continue;
342
343                 sdbt = cb->first_sdbt;
344                 curr = (unsigned long *) sdbt;
345                 start = sdbt;
346
347                 /* we'll free the SDBT after all SDBs are processed... */
348                 while (1) {
349                         if (!*curr || !sdbt)
350                                 break;
351
352                         /* watch for link entry reset if found */
353                         if (is_link_entry(curr)) {
354                                 curr = get_next_sdbt(curr);
355                                 if (sdbt)
356                                         free_page(sdbt);
357
358                                 /* we are done if we reach the start */
359                                 if ((unsigned long) curr == start)
360                                         break;
361                                 else
362                                         sdbt = (unsigned long) curr;
363                         } else {
364                                 /* process SDB pointer */
365                                 if (*curr) {
366                                         free_page(*curr);
367                                         curr++;
368                                 }
369                         }
370                         counter++;
371                 }
372                 cb->first_sdbt = 0;
373         }
374         return counter;
375 }
376
377 static int start_sampling(int cpu)
378 {
379         int rc;
380         struct hws_cpu_buffer *cb;
381
382         cb = &per_cpu(sampler_cpu_buffer, cpu);
383         rc = smp_ctl_ssctl_enable_activate(cpu, interval);
384         if (rc) {
385                 printk(KERN_INFO "hwsampler: CPU %d ssctl failed.\n", cpu);
386                 goto start_exit;
387         }
388
389         rc = -EINVAL;
390         if (!cb->qsi.es) {
391                 printk(KERN_INFO "hwsampler: CPU %d ssctl not enabled.\n", cpu);
392                 goto start_exit;
393         }
394
395         if (!cb->qsi.cs) {
396                 printk(KERN_INFO "hwsampler: CPU %d ssctl not active.\n", cpu);
397                 goto start_exit;
398         }
399
400         printk(KERN_INFO
401                 "hwsampler: CPU %d, CPUMF Sampling started, interval %lu.\n",
402                 cpu, interval);
403
404         rc = 0;
405
406 start_exit:
407         return rc;
408 }
409
410 static int stop_sampling(int cpu)
411 {
412         unsigned long v;
413         int rc;
414         struct hws_cpu_buffer *cb;
415
416         rc = smp_ctl_qsi(cpu);
417         WARN_ON(rc);
418
419         cb = &per_cpu(sampler_cpu_buffer, cpu);
420         if (!rc && !cb->qsi.es)
421                 printk(KERN_INFO "hwsampler: CPU %d, already stopped.\n", cpu);
422
423         rc = smp_ctl_ssctl_stop(cpu);
424         if (rc) {
425                 printk(KERN_INFO "hwsampler: CPU %d, ssctl stop error %d.\n",
426                                 cpu, rc);
427                 goto stop_exit;
428         }
429
430         printk(KERN_INFO "hwsampler: CPU %d, CPUMF Sampling stopped.\n", cpu);
431
432 stop_exit:
433         v = cb->req_alert;
434         if (v)
435                 printk(KERN_ERR "hwsampler: CPU %d CPUMF Request alert,"
436                                 " count=%lu.\n", cpu, v);
437
438         v = cb->loss_of_sample_data;
439         if (v)
440                 printk(KERN_ERR "hwsampler: CPU %d CPUMF Loss of sample data,"
441                                 " count=%lu.\n", cpu, v);
442
443         v = cb->invalid_entry_address;
444         if (v)
445                 printk(KERN_ERR "hwsampler: CPU %d CPUMF Invalid entry address,"
446                                 " count=%lu.\n", cpu, v);
447
448         v = cb->incorrect_sdbt_entry;
449         if (v)
450                 printk(KERN_ERR
451                                 "hwsampler: CPU %d CPUMF Incorrect SDBT address,"
452                                 " count=%lu.\n", cpu, v);
453
454         v = cb->sample_auth_change_alert;
455         if (v)
456                 printk(KERN_ERR
457                                 "hwsampler: CPU %d CPUMF Sample authorization change,"
458                                 " count=%lu.\n", cpu, v);
459
460         return rc;
461 }
462
463 static int check_hardware_prerequisites(void)
464 {
465         if (!test_facility(68))
466                 return -EOPNOTSUPP;
467         return 0;
468 }
469 /*
470  * hws_oom_callback() - the OOM callback function
471  *
472  * In case the callback is invoked during memory allocation for the
473  *  hw sampler, all obtained memory is deallocated and a flag is set
474  *  so main sampler memory allocation can exit with a failure code.
475  * In case the callback is invoked during sampling the hw sampler
476  *  is deactivated for all CPUs.
477  */
478 static int hws_oom_callback(struct notifier_block *nfb,
479         unsigned long dummy, void *parm)
480 {
481         unsigned long *freed;
482         int cpu;
483         struct hws_cpu_buffer *cb;
484
485         freed = parm;
486
487         mutex_lock(&hws_sem_oom);
488
489         if (hws_state == HWS_DEALLOCATED) {
490                 /* during memory allocation */
491                 if (oom_killer_was_active == 0) {
492                         oom_killer_was_active = 1;
493                         *freed += deallocate_sdbt();
494                 }
495         } else {
496                 int i;
497                 cpu = get_cpu();
498                 cb = &per_cpu(sampler_cpu_buffer, cpu);
499
500                 if (!cb->oom) {
501                         for_each_online_cpu(i) {
502                                 smp_ctl_ssctl_deactivate(i);
503                                 cb->oom = 1;
504                         }
505                         cb->finish = 1;
506
507                         printk(KERN_INFO
508                                 "hwsampler: CPU %d, OOM notify during CPUMF Sampling.\n",
509                                 cpu);
510                 }
511         }
512
513         mutex_unlock(&hws_sem_oom);
514
515         return NOTIFY_OK;
516 }
517
518 static struct notifier_block hws_oom_notifier = {
519         .notifier_call = hws_oom_callback
520 };
521
522 static int hws_cpu_callback(struct notifier_block *nfb,
523         unsigned long action, void *hcpu)
524 {
525         /* We do not have sampler space available for all possible CPUs.
526            All CPUs should be online when hw sampling is activated. */
527         return (hws_state <= HWS_DEALLOCATED) ? NOTIFY_OK : NOTIFY_BAD;
528 }
529
530 static struct notifier_block hws_cpu_notifier = {
531         .notifier_call = hws_cpu_callback
532 };
533
534 /**
535  * hwsampler_deactivate() - set hardware sampling temporarily inactive
536  * @cpu:  specifies the CPU to be set inactive.
537  *
538  * Returns 0 on success, !0 on failure.
539  */
540 int hwsampler_deactivate(unsigned int cpu)
541 {
542         /*
543          * Deactivate hw sampling temporarily and flush the buffer
544          * by pushing all the pending samples to oprofile buffer.
545          *
546          * This function can be called under one of the following conditions:
547          *     Memory unmap, task is exiting.
548          */
549         int rc;
550         struct hws_cpu_buffer *cb;
551
552         rc = 0;
553         mutex_lock(&hws_sem);
554
555         cb = &per_cpu(sampler_cpu_buffer, cpu);
556         if (hws_state == HWS_STARTED) {
557                 rc = smp_ctl_qsi(cpu);
558                 WARN_ON(rc);
559                 if (cb->qsi.cs) {
560                         rc = smp_ctl_ssctl_deactivate(cpu);
561                         if (rc) {
562                                 printk(KERN_INFO
563                                 "hwsampler: CPU %d, CPUMF Deactivation failed.\n", cpu);
564                                 cb->finish = 1;
565                                 hws_state = HWS_STOPPING;
566                         } else  {
567                                 hws_flush_all = 1;
568                                 /* Add work to queue to read pending samples.*/
569                                 queue_work_on(cpu, hws_wq, &cb->worker);
570                         }
571                 }
572         }
573         mutex_unlock(&hws_sem);
574
575         if (hws_wq)
576                 flush_workqueue(hws_wq);
577
578         return rc;
579 }
580
581 /**
582  * hwsampler_activate() - activate/resume hardware sampling which was deactivated
583  * @cpu:  specifies the CPU to be set active.
584  *
585  * Returns 0 on success, !0 on failure.
586  */
587 int hwsampler_activate(unsigned int cpu)
588 {
589         /*
590          * Re-activate hw sampling. This should be called in pair with
591          * hwsampler_deactivate().
592          */
593         int rc;
594         struct hws_cpu_buffer *cb;
595
596         rc = 0;
597         mutex_lock(&hws_sem);
598
599         cb = &per_cpu(sampler_cpu_buffer, cpu);
600         if (hws_state == HWS_STARTED) {
601                 rc = smp_ctl_qsi(cpu);
602                 WARN_ON(rc);
603                 if (!cb->qsi.cs) {
604                         hws_flush_all = 0;
605                         rc = smp_ctl_ssctl_enable_activate(cpu, interval);
606                         if (rc) {
607                                 printk(KERN_ERR
608                                 "CPU %d, CPUMF activate sampling failed.\n",
609                                          cpu);
610                         }
611                 }
612         }
613
614         mutex_unlock(&hws_sem);
615
616         return rc;
617 }
618
619 static int check_qsi_on_setup(void)
620 {
621         int rc;
622         unsigned int cpu;
623         struct hws_cpu_buffer *cb;
624
625         for_each_online_cpu(cpu) {
626                 cb = &per_cpu(sampler_cpu_buffer, cpu);
627                 rc = smp_ctl_qsi(cpu);
628                 WARN_ON(rc);
629                 if (rc)
630                         return -EOPNOTSUPP;
631
632                 if (!cb->qsi.as) {
633                         printk(KERN_INFO "hwsampler: CPUMF sampling is not authorized.\n");
634                         return -EINVAL;
635                 }
636
637                 if (cb->qsi.es) {
638                         printk(KERN_WARNING "hwsampler: CPUMF is still enabled.\n");
639                         rc = smp_ctl_ssctl_stop(cpu);
640                         if (rc)
641                                 return -EINVAL;
642
643                         printk(KERN_INFO
644                                 "CPU %d, CPUMF Sampling stopped now.\n", cpu);
645                 }
646         }
647         return 0;
648 }
649
650 static int check_qsi_on_start(void)
651 {
652         unsigned int cpu;
653         int rc;
654         struct hws_cpu_buffer *cb;
655
656         for_each_online_cpu(cpu) {
657                 cb = &per_cpu(sampler_cpu_buffer, cpu);
658                 rc = smp_ctl_qsi(cpu);
659                 WARN_ON(rc);
660
661                 if (!cb->qsi.as)
662                         return -EINVAL;
663
664                 if (cb->qsi.es)
665                         return -EINVAL;
666
667                 if (cb->qsi.cs)
668                         return -EINVAL;
669         }
670         return 0;
671 }
672
673 static void worker_on_start(unsigned int cpu)
674 {
675         struct hws_cpu_buffer *cb;
676
677         cb = &per_cpu(sampler_cpu_buffer, cpu);
678         cb->worker_entry = cb->first_sdbt;
679 }
680
681 static int worker_check_error(unsigned int cpu, int ext_params)
682 {
683         int rc;
684         unsigned long *sdbt;
685         struct hws_cpu_buffer *cb;
686
687         rc = 0;
688         cb = &per_cpu(sampler_cpu_buffer, cpu);
689         sdbt = (unsigned long *) cb->worker_entry;
690
691         if (!sdbt || !*sdbt)
692                 return -EINVAL;
693
694         if (ext_params & CPU_MF_INT_SF_PRA)
695                 cb->req_alert++;
696
697         if (ext_params & CPU_MF_INT_SF_LSDA)
698                 cb->loss_of_sample_data++;
699
700         if (ext_params & CPU_MF_INT_SF_IAE) {
701                 cb->invalid_entry_address++;
702                 rc = -EINVAL;
703         }
704
705         if (ext_params & CPU_MF_INT_SF_ISE) {
706                 cb->incorrect_sdbt_entry++;
707                 rc = -EINVAL;
708         }
709
710         if (ext_params & CPU_MF_INT_SF_SACA) {
711                 cb->sample_auth_change_alert++;
712                 rc = -EINVAL;
713         }
714
715         return rc;
716 }
717
718 static void worker_on_finish(unsigned int cpu)
719 {
720         int rc, i;
721         struct hws_cpu_buffer *cb;
722
723         cb = &per_cpu(sampler_cpu_buffer, cpu);
724
725         if (cb->finish) {
726                 rc = smp_ctl_qsi(cpu);
727                 WARN_ON(rc);
728                 if (cb->qsi.es) {
729                         printk(KERN_INFO
730                                 "hwsampler: CPU %d, CPUMF Stop/Deactivate sampling.\n",
731                                 cpu);
732                         rc = smp_ctl_ssctl_stop(cpu);
733                         if (rc)
734                                 printk(KERN_INFO
735                                         "hwsampler: CPU %d, CPUMF Deactivation failed.\n",
736                                         cpu);
737
738                         for_each_online_cpu(i) {
739                                 if (i == cpu)
740                                         continue;
741                                 if (!cb->finish) {
742                                         cb->finish = 1;
743                                         queue_work_on(i, hws_wq,
744                                                 &cb->worker);
745                                 }
746                         }
747                 }
748         }
749 }
750
751 static void worker_on_interrupt(unsigned int cpu)
752 {
753         unsigned long *sdbt;
754         unsigned char done;
755         struct hws_cpu_buffer *cb;
756
757         cb = &per_cpu(sampler_cpu_buffer, cpu);
758
759         sdbt = (unsigned long *) cb->worker_entry;
760
761         done = 0;
762         /* do not proceed if stop was entered,
763          * forget the buffers not yet processed */
764         while (!done && !cb->stop_mode) {
765                 unsigned long *trailer;
766                 struct hws_trailer_entry *te;
767                 unsigned long *dear = 0;
768
769                 trailer = trailer_entry_ptr(*sdbt);
770                 /* leave loop if no more work to do */
771                 if (!(*trailer & SDB_TE_BUFFER_FULL_MASK)) {
772                         done = 1;
773                         if (!hws_flush_all)
774                                 continue;
775                 }
776
777                 te = (struct hws_trailer_entry *)trailer;
778                 cb->sample_overflow += te->overflow;
779
780                 add_samples_to_oprofile(cpu, sdbt, dear);
781
782                 /* reset trailer */
783                 xchg((unsigned char *) te, 0x40);
784
785                 /* advance to next sdb slot in current sdbt */
786                 sdbt++;
787                 /* in case link bit is set use address w/o link bit */
788                 if (is_link_entry(sdbt))
789                         sdbt = get_next_sdbt(sdbt);
790
791                 cb->worker_entry = (unsigned long)sdbt;
792         }
793 }
794
795 static void add_samples_to_oprofile(unsigned int cpu, unsigned long *sdbt,
796                 unsigned long *dear)
797 {
798         struct hws_basic_entry *sample_data_ptr;
799         unsigned long *trailer;
800
801         trailer = trailer_entry_ptr(*sdbt);
802         if (dear) {
803                 if (dear > trailer)
804                         return;
805                 trailer = dear;
806         }
807
808         sample_data_ptr = (struct hws_basic_entry *)(*sdbt);
809
810         while ((unsigned long *)sample_data_ptr < trailer) {
811                 struct pt_regs *regs = NULL;
812                 struct task_struct *tsk = NULL;
813
814                 /*
815                  * Check sampling mode, 1 indicates basic (=customer) sampling
816                  * mode.
817                  */
818                 if (sample_data_ptr->def != 1) {
819                         /* sample slot is not yet written */
820                         break;
821                 } else {
822                         /* make sure we don't use it twice,
823                          * the next time the sampler will set it again */
824                         sample_data_ptr->def = 0;
825                 }
826
827                 /* Get pt_regs. */
828                 if (sample_data_ptr->P == 1) {
829                         /* userspace sample */
830                         unsigned int pid = sample_data_ptr->prim_asn;
831                         if (!counter_config.user)
832                                 goto skip_sample;
833                         rcu_read_lock();
834                         tsk = pid_task(find_vpid(pid), PIDTYPE_PID);
835                         if (tsk)
836                                 regs = task_pt_regs(tsk);
837                         rcu_read_unlock();
838                 } else {
839                         /* kernelspace sample */
840                         if (!counter_config.kernel)
841                                 goto skip_sample;
842                         regs = task_pt_regs(current);
843                 }
844
845                 mutex_lock(&hws_sem);
846                 oprofile_add_ext_hw_sample(sample_data_ptr->ia, regs, 0,
847                                 !sample_data_ptr->P, tsk);
848                 mutex_unlock(&hws_sem);
849         skip_sample:
850                 sample_data_ptr++;
851         }
852 }
853
854 static void worker(struct work_struct *work)
855 {
856         unsigned int cpu;
857         int ext_params;
858         struct hws_cpu_buffer *cb;
859
860         cb = container_of(work, struct hws_cpu_buffer, worker);
861         cpu = smp_processor_id();
862         ext_params = atomic_xchg(&cb->ext_params, 0);
863
864         if (!cb->worker_entry)
865                 worker_on_start(cpu);
866
867         if (worker_check_error(cpu, ext_params))
868                 return;
869
870         if (!cb->finish)
871                 worker_on_interrupt(cpu);
872
873         if (cb->finish)
874                 worker_on_finish(cpu);
875 }
876
877 /**
878  * hwsampler_allocate() - allocate memory for the hardware sampler
879  * @sdbt:  number of SDBTs per online CPU (must be > 0)
880  * @sdb:   number of SDBs per SDBT (minimum 1, maximum 511)
881  *
882  * Returns 0 on success, !0 on failure.
883  */
884 int hwsampler_allocate(unsigned long sdbt, unsigned long sdb)
885 {
886         int cpu, rc;
887         mutex_lock(&hws_sem);
888
889         rc = -EINVAL;
890         if (hws_state != HWS_DEALLOCATED)
891                 goto allocate_exit;
892
893         if (sdbt < 1)
894                 goto allocate_exit;
895
896         if (sdb > MAX_NUM_SDB || sdb < MIN_NUM_SDB)
897                 goto allocate_exit;
898
899         num_sdbt = sdbt;
900         num_sdb = sdb;
901
902         oom_killer_was_active = 0;
903         register_oom_notifier(&hws_oom_notifier);
904
905         for_each_online_cpu(cpu) {
906                 if (allocate_sdbt(cpu)) {
907                         unregister_oom_notifier(&hws_oom_notifier);
908                         goto allocate_error;
909                 }
910         }
911         unregister_oom_notifier(&hws_oom_notifier);
912         if (oom_killer_was_active)
913                 goto allocate_error;
914
915         hws_state = HWS_STOPPED;
916         rc = 0;
917
918 allocate_exit:
919         mutex_unlock(&hws_sem);
920         return rc;
921
922 allocate_error:
923         rc = -ENOMEM;
924         printk(KERN_ERR "hwsampler: CPUMF Memory allocation failed.\n");
925         goto allocate_exit;
926 }
927
928 /**
929  * hwsampler_deallocate() - deallocate hardware sampler memory
930  *
931  * Returns 0 on success, !0 on failure.
932  */
933 int hwsampler_deallocate(void)
934 {
935         int rc;
936
937         mutex_lock(&hws_sem);
938
939         rc = -EINVAL;
940         if (hws_state != HWS_STOPPED)
941                 goto deallocate_exit;
942
943         irq_subclass_unregister(IRQ_SUBCLASS_MEASUREMENT_ALERT);
944         hws_alert = 0;
945         deallocate_sdbt();
946
947         hws_state = HWS_DEALLOCATED;
948         rc = 0;
949
950 deallocate_exit:
951         mutex_unlock(&hws_sem);
952
953         return rc;
954 }
955
956 unsigned long hwsampler_query_min_interval(void)
957 {
958         return min_sampler_rate;
959 }
960
961 unsigned long hwsampler_query_max_interval(void)
962 {
963         return max_sampler_rate;
964 }
965
966 unsigned long hwsampler_get_sample_overflow_count(unsigned int cpu)
967 {
968         struct hws_cpu_buffer *cb;
969
970         cb = &per_cpu(sampler_cpu_buffer, cpu);
971
972         return cb->sample_overflow;
973 }
974
975 int hwsampler_setup(void)
976 {
977         int rc;
978         int cpu;
979         struct hws_cpu_buffer *cb;
980
981         mutex_lock(&hws_sem);
982
983         rc = -EINVAL;
984         if (hws_state)
985                 goto setup_exit;
986
987         hws_state = HWS_INIT;
988
989         init_all_cpu_buffers();
990
991         rc = check_hardware_prerequisites();
992         if (rc)
993                 goto setup_exit;
994
995         rc = check_qsi_on_setup();
996         if (rc)
997                 goto setup_exit;
998
999         rc = -EINVAL;
1000         hws_wq = create_workqueue("hwsampler");
1001         if (!hws_wq)
1002                 goto setup_exit;
1003
1004         register_cpu_notifier(&hws_cpu_notifier);
1005
1006         for_each_online_cpu(cpu) {
1007                 cb = &per_cpu(sampler_cpu_buffer, cpu);
1008                 INIT_WORK(&cb->worker, worker);
1009                 rc = smp_ctl_qsi(cpu);
1010                 WARN_ON(rc);
1011                 if (min_sampler_rate != cb->qsi.min_sampl_rate) {
1012                         if (min_sampler_rate) {
1013                                 printk(KERN_WARNING
1014                                         "hwsampler: different min sampler rate values.\n");
1015                                 if (min_sampler_rate < cb->qsi.min_sampl_rate)
1016                                         min_sampler_rate =
1017                                                 cb->qsi.min_sampl_rate;
1018                         } else
1019                                 min_sampler_rate = cb->qsi.min_sampl_rate;
1020                 }
1021                 if (max_sampler_rate != cb->qsi.max_sampl_rate) {
1022                         if (max_sampler_rate) {
1023                                 printk(KERN_WARNING
1024                                         "hwsampler: different max sampler rate values.\n");
1025                                 if (max_sampler_rate > cb->qsi.max_sampl_rate)
1026                                         max_sampler_rate =
1027                                                 cb->qsi.max_sampl_rate;
1028                         } else
1029                                 max_sampler_rate = cb->qsi.max_sampl_rate;
1030                 }
1031         }
1032         register_external_irq(EXT_IRQ_MEASURE_ALERT, hws_ext_handler);
1033
1034         hws_state = HWS_DEALLOCATED;
1035         rc = 0;
1036
1037 setup_exit:
1038         mutex_unlock(&hws_sem);
1039         return rc;
1040 }
1041
1042 int hwsampler_shutdown(void)
1043 {
1044         int rc;
1045
1046         mutex_lock(&hws_sem);
1047
1048         rc = -EINVAL;
1049         if (hws_state == HWS_DEALLOCATED || hws_state == HWS_STOPPED) {
1050                 mutex_unlock(&hws_sem);
1051
1052                 if (hws_wq)
1053                         flush_workqueue(hws_wq);
1054
1055                 mutex_lock(&hws_sem);
1056
1057                 if (hws_state == HWS_STOPPED) {
1058                         irq_subclass_unregister(IRQ_SUBCLASS_MEASUREMENT_ALERT);
1059                         hws_alert = 0;
1060                         deallocate_sdbt();
1061                 }
1062                 if (hws_wq) {
1063                         destroy_workqueue(hws_wq);
1064                         hws_wq = NULL;
1065                 }
1066
1067                 unregister_external_irq(EXT_IRQ_MEASURE_ALERT, hws_ext_handler);
1068                 hws_state = HWS_INIT;
1069                 rc = 0;
1070         }
1071         mutex_unlock(&hws_sem);
1072
1073         unregister_cpu_notifier(&hws_cpu_notifier);
1074
1075         return rc;
1076 }
1077
1078 /**
1079  * hwsampler_start_all() - start hardware sampling on all online CPUs
1080  * @rate:  specifies the used interval when samples are taken
1081  *
1082  * Returns 0 on success, !0 on failure.
1083  */
1084 int hwsampler_start_all(unsigned long rate)
1085 {
1086         int rc, cpu;
1087
1088         mutex_lock(&hws_sem);
1089
1090         hws_oom = 0;
1091
1092         rc = -EINVAL;
1093         if (hws_state != HWS_STOPPED)
1094                 goto start_all_exit;
1095
1096         interval = rate;
1097
1098         /* fail if rate is not valid */
1099         if (interval < min_sampler_rate || interval > max_sampler_rate)
1100                 goto start_all_exit;
1101
1102         rc = check_qsi_on_start();
1103         if (rc)
1104                 goto start_all_exit;
1105
1106         prepare_cpu_buffers();
1107
1108         for_each_online_cpu(cpu) {
1109                 rc = start_sampling(cpu);
1110                 if (rc)
1111                         break;
1112         }
1113         if (rc) {
1114                 for_each_online_cpu(cpu) {
1115                         stop_sampling(cpu);
1116                 }
1117                 goto start_all_exit;
1118         }
1119         hws_state = HWS_STARTED;
1120         rc = 0;
1121
1122 start_all_exit:
1123         mutex_unlock(&hws_sem);
1124
1125         if (rc)
1126                 return rc;
1127
1128         register_oom_notifier(&hws_oom_notifier);
1129         hws_oom = 1;
1130         hws_flush_all = 0;
1131         /* now let them in, 1407 CPUMF external interrupts */
1132         hws_alert = 1;
1133         irq_subclass_register(IRQ_SUBCLASS_MEASUREMENT_ALERT);
1134
1135         return 0;
1136 }
1137
1138 /**
1139  * hwsampler_stop_all() - stop hardware sampling on all online CPUs
1140  *
1141  * Returns 0 on success, !0 on failure.
1142  */
1143 int hwsampler_stop_all(void)
1144 {
1145         int tmp_rc, rc, cpu;
1146         struct hws_cpu_buffer *cb;
1147
1148         mutex_lock(&hws_sem);
1149
1150         rc = 0;
1151         if (hws_state == HWS_INIT) {
1152                 mutex_unlock(&hws_sem);
1153                 return 0;
1154         }
1155         hws_state = HWS_STOPPING;
1156         mutex_unlock(&hws_sem);
1157
1158         for_each_online_cpu(cpu) {
1159                 cb = &per_cpu(sampler_cpu_buffer, cpu);
1160                 cb->stop_mode = 1;
1161                 tmp_rc = stop_sampling(cpu);
1162                 if (tmp_rc)
1163                         rc = tmp_rc;
1164         }
1165
1166         if (hws_wq)
1167                 flush_workqueue(hws_wq);
1168
1169         mutex_lock(&hws_sem);
1170         if (hws_oom) {
1171                 unregister_oom_notifier(&hws_oom_notifier);
1172                 hws_oom = 0;
1173         }
1174         hws_state = HWS_STOPPED;
1175         mutex_unlock(&hws_sem);
1176
1177         return rc;
1178 }