pcr.c (7991B)
1// SPDX-License-Identifier: GPL-2.0-only 2/* pcr.c: Generic sparc64 performance counter infrastructure. 3 * 4 * Copyright (C) 2009 David S. Miller (davem@davemloft.net) 5 */ 6#include <linux/kernel.h> 7#include <linux/export.h> 8#include <linux/init.h> 9#include <linux/irq.h> 10 11#include <linux/irq_work.h> 12#include <linux/ftrace.h> 13 14#include <asm/pil.h> 15#include <asm/pcr.h> 16#include <asm/nmi.h> 17#include <asm/asi.h> 18#include <asm/spitfire.h> 19 20/* This code is shared between various users of the performance 21 * counters. Users will be oprofile, pseudo-NMI watchdog, and the 22 * perf_event support layer. 23 */ 24 25/* Performance counter interrupts run unmasked at PIL level 15. 26 * Therefore we can't do things like wakeups and other work 27 * that expects IRQ disabling to be adhered to in locking etc. 28 * 29 * Therefore in such situations we defer the work by signalling 30 * a lower level cpu IRQ. 31 */ 32void __irq_entry deferred_pcr_work_irq(int irq, struct pt_regs *regs) 33{ 34 struct pt_regs *old_regs; 35 36 clear_softint(1 << PIL_DEFERRED_PCR_WORK); 37 38 old_regs = set_irq_regs(regs); 39 irq_enter(); 40#ifdef CONFIG_IRQ_WORK 41 irq_work_run(); 42#endif 43 irq_exit(); 44 set_irq_regs(old_regs); 45} 46 47void arch_irq_work_raise(void) 48{ 49 set_softint(1 << PIL_DEFERRED_PCR_WORK); 50} 51 52const struct pcr_ops *pcr_ops; 53EXPORT_SYMBOL_GPL(pcr_ops); 54 55static u64 direct_pcr_read(unsigned long reg_num) 56{ 57 u64 val; 58 59 WARN_ON_ONCE(reg_num != 0); 60 __asm__ __volatile__("rd %%pcr, %0" : "=r" (val)); 61 return val; 62} 63 64static void direct_pcr_write(unsigned long reg_num, u64 val) 65{ 66 WARN_ON_ONCE(reg_num != 0); 67 __asm__ __volatile__("wr %0, 0x0, %%pcr" : : "r" (val)); 68} 69 70static u64 direct_pic_read(unsigned long reg_num) 71{ 72 u64 val; 73 74 WARN_ON_ONCE(reg_num != 0); 75 __asm__ __volatile__("rd %%pic, %0" : "=r" (val)); 76 return val; 77} 78 79static void direct_pic_write(unsigned long reg_num, u64 val) 80{ 81 WARN_ON_ONCE(reg_num != 0); 82 83 /* Blackbird errata workaround. See commentary in 84 * arch/sparc64/kernel/smp.c:smp_percpu_timer_interrupt() 85 * for more information. 86 */ 87 __asm__ __volatile__("ba,pt %%xcc, 99f\n\t" 88 " nop\n\t" 89 ".align 64\n" 90 "99:wr %0, 0x0, %%pic\n\t" 91 "rd %%pic, %%g0" : : "r" (val)); 92} 93 94static u64 direct_picl_value(unsigned int nmi_hz) 95{ 96 u32 delta = local_cpu_data().clock_tick / nmi_hz; 97 98 return ((u64)((0 - delta) & 0xffffffff)) << 32; 99} 100 101static const struct pcr_ops direct_pcr_ops = { 102 .read_pcr = direct_pcr_read, 103 .write_pcr = direct_pcr_write, 104 .read_pic = direct_pic_read, 105 .write_pic = direct_pic_write, 106 .nmi_picl_value = direct_picl_value, 107 .pcr_nmi_enable = (PCR_PIC_PRIV | PCR_STRACE | PCR_UTRACE), 108 .pcr_nmi_disable = PCR_PIC_PRIV, 109}; 110 111static void n2_pcr_write(unsigned long reg_num, u64 val) 112{ 113 unsigned long ret; 114 115 WARN_ON_ONCE(reg_num != 0); 116 if (val & PCR_N2_HTRACE) { 117 ret = sun4v_niagara2_setperf(HV_N2_PERF_SPARC_CTL, val); 118 if (ret != HV_EOK) 119 direct_pcr_write(reg_num, val); 120 } else 121 direct_pcr_write(reg_num, val); 122} 123 124static u64 n2_picl_value(unsigned int nmi_hz) 125{ 126 u32 delta = local_cpu_data().clock_tick / (nmi_hz << 2); 127 128 return ((u64)((0 - delta) & 0xffffffff)) << 32; 129} 130 131static const struct pcr_ops n2_pcr_ops = { 132 .read_pcr = direct_pcr_read, 133 .write_pcr = n2_pcr_write, 134 .read_pic = direct_pic_read, 135 .write_pic = direct_pic_write, 136 .nmi_picl_value = n2_picl_value, 137 .pcr_nmi_enable = (PCR_PIC_PRIV | PCR_STRACE | PCR_UTRACE | 138 PCR_N2_TOE_OV1 | 139 (2 << PCR_N2_SL1_SHIFT) | 140 (0xff << PCR_N2_MASK1_SHIFT)), 141 .pcr_nmi_disable = PCR_PIC_PRIV, 142}; 143 144static u64 n4_pcr_read(unsigned long reg_num) 145{ 146 unsigned long val; 147 148 (void) sun4v_vt_get_perfreg(reg_num, &val); 149 150 return val; 151} 152 153static void n4_pcr_write(unsigned long reg_num, u64 val) 154{ 155 (void) sun4v_vt_set_perfreg(reg_num, val); 156} 157 158static u64 n4_pic_read(unsigned long reg_num) 159{ 160 unsigned long val; 161 162 __asm__ __volatile__("ldxa [%1] %2, %0" 163 : "=r" (val) 164 : "r" (reg_num * 0x8UL), "i" (ASI_PIC)); 165 166 return val; 167} 168 169static void n4_pic_write(unsigned long reg_num, u64 val) 170{ 171 __asm__ __volatile__("stxa %0, [%1] %2" 172 : /* no outputs */ 173 : "r" (val), "r" (reg_num * 0x8UL), "i" (ASI_PIC)); 174} 175 176static u64 n4_picl_value(unsigned int nmi_hz) 177{ 178 u32 delta = local_cpu_data().clock_tick / (nmi_hz << 2); 179 180 return ((u64)((0 - delta) & 0xffffffff)); 181} 182 183static const struct pcr_ops n4_pcr_ops = { 184 .read_pcr = n4_pcr_read, 185 .write_pcr = n4_pcr_write, 186 .read_pic = n4_pic_read, 187 .write_pic = n4_pic_write, 188 .nmi_picl_value = n4_picl_value, 189 .pcr_nmi_enable = (PCR_N4_PICNPT | PCR_N4_STRACE | 190 PCR_N4_UTRACE | PCR_N4_TOE | 191 (26 << PCR_N4_SL_SHIFT)), 192 .pcr_nmi_disable = PCR_N4_PICNPT, 193}; 194 195static u64 n5_pcr_read(unsigned long reg_num) 196{ 197 unsigned long val; 198 199 (void) sun4v_t5_get_perfreg(reg_num, &val); 200 201 return val; 202} 203 204static void n5_pcr_write(unsigned long reg_num, u64 val) 205{ 206 (void) sun4v_t5_set_perfreg(reg_num, val); 207} 208 209static const struct pcr_ops n5_pcr_ops = { 210 .read_pcr = n5_pcr_read, 211 .write_pcr = n5_pcr_write, 212 .read_pic = n4_pic_read, 213 .write_pic = n4_pic_write, 214 .nmi_picl_value = n4_picl_value, 215 .pcr_nmi_enable = (PCR_N4_PICNPT | PCR_N4_STRACE | 216 PCR_N4_UTRACE | PCR_N4_TOE | 217 (26 << PCR_N4_SL_SHIFT)), 218 .pcr_nmi_disable = PCR_N4_PICNPT, 219}; 220 221static u64 m7_pcr_read(unsigned long reg_num) 222{ 223 unsigned long val; 224 225 (void) sun4v_m7_get_perfreg(reg_num, &val); 226 227 return val; 228} 229 230static void m7_pcr_write(unsigned long reg_num, u64 val) 231{ 232 (void) sun4v_m7_set_perfreg(reg_num, val); 233} 234 235static const struct pcr_ops m7_pcr_ops = { 236 .read_pcr = m7_pcr_read, 237 .write_pcr = m7_pcr_write, 238 .read_pic = n4_pic_read, 239 .write_pic = n4_pic_write, 240 .nmi_picl_value = n4_picl_value, 241 .pcr_nmi_enable = (PCR_N4_PICNPT | PCR_N4_STRACE | 242 PCR_N4_UTRACE | PCR_N4_TOE | 243 (26 << PCR_N4_SL_SHIFT)), 244 .pcr_nmi_disable = PCR_N4_PICNPT, 245}; 246 247static unsigned long perf_hsvc_group; 248static unsigned long perf_hsvc_major; 249static unsigned long perf_hsvc_minor; 250 251static int __init register_perf_hsvc(void) 252{ 253 unsigned long hverror; 254 255 if (tlb_type == hypervisor) { 256 switch (sun4v_chip_type) { 257 case SUN4V_CHIP_NIAGARA1: 258 perf_hsvc_group = HV_GRP_NIAG_PERF; 259 break; 260 261 case SUN4V_CHIP_NIAGARA2: 262 perf_hsvc_group = HV_GRP_N2_CPU; 263 break; 264 265 case SUN4V_CHIP_NIAGARA3: 266 perf_hsvc_group = HV_GRP_KT_CPU; 267 break; 268 269 case SUN4V_CHIP_NIAGARA4: 270 perf_hsvc_group = HV_GRP_VT_CPU; 271 break; 272 273 case SUN4V_CHIP_NIAGARA5: 274 perf_hsvc_group = HV_GRP_T5_CPU; 275 break; 276 277 case SUN4V_CHIP_SPARC_M7: 278 perf_hsvc_group = HV_GRP_M7_PERF; 279 break; 280 281 default: 282 return -ENODEV; 283 } 284 285 286 perf_hsvc_major = 1; 287 perf_hsvc_minor = 0; 288 hverror = sun4v_hvapi_register(perf_hsvc_group, 289 perf_hsvc_major, 290 &perf_hsvc_minor); 291 if (hverror) { 292 pr_err("perfmon: Could not register hvapi(0x%lx).\n", 293 hverror); 294 return -ENODEV; 295 } 296 } 297 return 0; 298} 299 300static void __init unregister_perf_hsvc(void) 301{ 302 if (tlb_type != hypervisor) 303 return; 304 sun4v_hvapi_unregister(perf_hsvc_group); 305} 306 307static int __init setup_sun4v_pcr_ops(void) 308{ 309 int ret = 0; 310 311 switch (sun4v_chip_type) { 312 case SUN4V_CHIP_NIAGARA1: 313 case SUN4V_CHIP_NIAGARA2: 314 case SUN4V_CHIP_NIAGARA3: 315 pcr_ops = &n2_pcr_ops; 316 break; 317 318 case SUN4V_CHIP_NIAGARA4: 319 pcr_ops = &n4_pcr_ops; 320 break; 321 322 case SUN4V_CHIP_NIAGARA5: 323 pcr_ops = &n5_pcr_ops; 324 break; 325 326 case SUN4V_CHIP_SPARC_M7: 327 pcr_ops = &m7_pcr_ops; 328 break; 329 330 default: 331 ret = -ENODEV; 332 break; 333 } 334 335 return ret; 336} 337 338int __init pcr_arch_init(void) 339{ 340 int err = register_perf_hsvc(); 341 342 if (err) 343 return err; 344 345 switch (tlb_type) { 346 case hypervisor: 347 err = setup_sun4v_pcr_ops(); 348 if (err) 349 goto out_unregister; 350 break; 351 352 case cheetah: 353 case cheetah_plus: 354 pcr_ops = &direct_pcr_ops; 355 break; 356 357 case spitfire: 358 /* UltraSPARC-I/II and derivatives lack a profile 359 * counter overflow interrupt so we can't make use of 360 * their hardware currently. 361 */ 362 fallthrough; 363 default: 364 err = -ENODEV; 365 goto out_unregister; 366 } 367 368 return nmi_init(); 369 370out_unregister: 371 unregister_perf_hsvc(); 372 return err; 373}