1 /* pcr.c: Generic sparc64 performance counter infrastructure.
3 * Copyright (C) 2009 David S. Miller (davem@davemloft.net)
5 #include <linux/kernel.h>
6 #include <linux/export.h>
7 #include <linux/init.h>
10 #include <linux/irq_work.h>
11 #include <linux/ftrace.h>
17 #include <asm/spitfire.h>
19 /* This code is shared between various users of the performance
20 * counters. Users will be oprofile, pseudo-NMI watchdog, and the
21 * perf_event support layer.
24 /* Performance counter interrupts run unmasked at PIL level 15.
25 * Therefore we can't do things like wakeups and other work
26 * that expects IRQ disabling to be adhered to in locking etc.
28 * Therefore in such situations we defer the work by signalling
29 * a lower level cpu IRQ.
31 void __irq_entry deferred_pcr_work_irq(int irq, struct pt_regs *regs)
33 struct pt_regs *old_regs;
35 clear_softint(1 << PIL_DEFERRED_PCR_WORK);
37 old_regs = set_irq_regs(regs);
39 #ifdef CONFIG_IRQ_WORK
43 set_irq_regs(old_regs);
46 void arch_irq_work_raise(void)
48 set_softint(1 << PIL_DEFERRED_PCR_WORK);
51 const struct pcr_ops *pcr_ops;
52 EXPORT_SYMBOL_GPL(pcr_ops);
54 static u64 direct_pcr_read(unsigned long reg_num)
58 WARN_ON_ONCE(reg_num != 0);
59 __asm__ __volatile__("rd %%pcr, %0" : "=r" (val));
63 static void direct_pcr_write(unsigned long reg_num, u64 val)
65 WARN_ON_ONCE(reg_num != 0);
66 __asm__ __volatile__("wr %0, 0x0, %%pcr" : : "r" (val));
69 static u64 direct_pic_read(unsigned long reg_num)
73 WARN_ON_ONCE(reg_num != 0);
74 __asm__ __volatile__("rd %%pic, %0" : "=r" (val));
78 static void direct_pic_write(unsigned long reg_num, u64 val)
80 WARN_ON_ONCE(reg_num != 0);
82 /* Blackbird errata workaround. See commentary in
83 * arch/sparc64/kernel/smp.c:smp_percpu_timer_interrupt()
84 * for more information.
86 __asm__ __volatile__("ba,pt %%xcc, 99f\n\t"
89 "99:wr %0, 0x0, %%pic\n\t"
90 "rd %%pic, %%g0" : : "r" (val));
93 static u64 direct_picl_value(unsigned int nmi_hz)
95 u32 delta = local_cpu_data().clock_tick / nmi_hz;
97 return ((u64)((0 - delta) & 0xffffffff)) << 32;
100 static const struct pcr_ops direct_pcr_ops = {
101 .read_pcr = direct_pcr_read,
102 .write_pcr = direct_pcr_write,
103 .read_pic = direct_pic_read,
104 .write_pic = direct_pic_write,
105 .nmi_picl_value = direct_picl_value,
106 .pcr_nmi_enable = (PCR_PIC_PRIV | PCR_STRACE | PCR_UTRACE),
107 .pcr_nmi_disable = PCR_PIC_PRIV,
110 static void n2_pcr_write(unsigned long reg_num, u64 val)
114 WARN_ON_ONCE(reg_num != 0);
115 if (val & PCR_N2_HTRACE) {
116 ret = sun4v_niagara2_setperf(HV_N2_PERF_SPARC_CTL, val);
118 direct_pcr_write(reg_num, val);
120 direct_pcr_write(reg_num, val);
123 static u64 n2_picl_value(unsigned int nmi_hz)
125 u32 delta = local_cpu_data().clock_tick / (nmi_hz << 2);
127 return ((u64)((0 - delta) & 0xffffffff)) << 32;
130 static const struct pcr_ops n2_pcr_ops = {
131 .read_pcr = direct_pcr_read,
132 .write_pcr = n2_pcr_write,
133 .read_pic = direct_pic_read,
134 .write_pic = direct_pic_write,
135 .nmi_picl_value = n2_picl_value,
136 .pcr_nmi_enable = (PCR_PIC_PRIV | PCR_STRACE | PCR_UTRACE |
138 (2 << PCR_N2_SL1_SHIFT) |
139 (0xff << PCR_N2_MASK1_SHIFT)),
140 .pcr_nmi_disable = PCR_PIC_PRIV,
143 static u64 n4_pcr_read(unsigned long reg_num)
147 (void) sun4v_vt_get_perfreg(reg_num, &val);
152 static void n4_pcr_write(unsigned long reg_num, u64 val)
154 (void) sun4v_vt_set_perfreg(reg_num, val);
157 static u64 n4_pic_read(unsigned long reg_num)
161 __asm__ __volatile__("ldxa [%1] %2, %0"
163 : "r" (reg_num * 0x8UL), "i" (ASI_PIC));
168 static void n4_pic_write(unsigned long reg_num, u64 val)
170 __asm__ __volatile__("stxa %0, [%1] %2"
172 : "r" (val), "r" (reg_num * 0x8UL), "i" (ASI_PIC));
175 static u64 n4_picl_value(unsigned int nmi_hz)
177 u32 delta = local_cpu_data().clock_tick / (nmi_hz << 2);
179 return ((u64)((0 - delta) & 0xffffffff));
182 static const struct pcr_ops n4_pcr_ops = {
183 .read_pcr = n4_pcr_read,
184 .write_pcr = n4_pcr_write,
185 .read_pic = n4_pic_read,
186 .write_pic = n4_pic_write,
187 .nmi_picl_value = n4_picl_value,
188 .pcr_nmi_enable = (PCR_N4_PICNPT | PCR_N4_STRACE |
189 PCR_N4_UTRACE | PCR_N4_TOE |
190 (26 << PCR_N4_SL_SHIFT)),
191 .pcr_nmi_disable = PCR_N4_PICNPT,
194 static unsigned long perf_hsvc_group;
195 static unsigned long perf_hsvc_major;
196 static unsigned long perf_hsvc_minor;
198 static int __init register_perf_hsvc(void)
200 if (tlb_type == hypervisor) {
201 switch (sun4v_chip_type) {
202 case SUN4V_CHIP_NIAGARA1:
203 perf_hsvc_group = HV_GRP_NIAG_PERF;
206 case SUN4V_CHIP_NIAGARA2:
207 perf_hsvc_group = HV_GRP_N2_CPU;
210 case SUN4V_CHIP_NIAGARA3:
211 perf_hsvc_group = HV_GRP_KT_CPU;
214 case SUN4V_CHIP_NIAGARA4:
215 perf_hsvc_group = HV_GRP_VT_CPU;
225 if (sun4v_hvapi_register(perf_hsvc_group,
228 printk("perfmon: Could not register hvapi.\n");
235 static void __init unregister_perf_hsvc(void)
237 if (tlb_type != hypervisor)
239 sun4v_hvapi_unregister(perf_hsvc_group);
242 static int __init setup_sun4v_pcr_ops(void)
246 switch (sun4v_chip_type) {
247 case SUN4V_CHIP_NIAGARA1:
248 case SUN4V_CHIP_NIAGARA2:
249 case SUN4V_CHIP_NIAGARA3:
250 pcr_ops = &n2_pcr_ops;
253 case SUN4V_CHIP_NIAGARA4:
254 pcr_ops = &n4_pcr_ops;
265 int __init pcr_arch_init(void)
267 int err = register_perf_hsvc();
274 err = setup_sun4v_pcr_ops();
281 pcr_ops = &direct_pcr_ops;
285 /* UltraSPARC-I/II and derivatives lack a profile
286 * counter overflow interrupt so we can't make use of
287 * their hardware currently.
298 unregister_perf_hsvc();