bbc_envctrl.c (16271B)
1// SPDX-License-Identifier: GPL-2.0 2/* bbc_envctrl.c: UltraSPARC-III environment control driver. 3 * 4 * Copyright (C) 2001, 2008 David S. Miller (davem@davemloft.net) 5 */ 6 7#include <linux/kthread.h> 8#include <linux/delay.h> 9#include <linux/kmod.h> 10#include <linux/reboot.h> 11#include <linux/of.h> 12#include <linux/slab.h> 13#include <linux/of_device.h> 14#include <asm/oplib.h> 15 16#include "bbc_i2c.h" 17#include "max1617.h" 18 19#undef ENVCTRL_TRACE 20 21/* WARNING: Making changes to this driver is very dangerous. 22 * If you misprogram the sensor chips they can 23 * cut the power on you instantly. 24 */ 25 26/* Two temperature sensors exist in the SunBLADE-1000 enclosure. 27 * Both are implemented using max1617 i2c devices. Each max1617 28 * monitors 2 temperatures, one for one of the cpu dies and the other 29 * for the ambient temperature. 30 * 31 * The max1617 is capable of being programmed with power-off 32 * temperature values, one low limit and one high limit. These 33 * can be controlled independently for the cpu or ambient temperature. 34 * If a limit is violated, the power is simply shut off. The frequency 35 * with which the max1617 does temperature sampling can be controlled 36 * as well. 37 * 38 * Three fans exist inside the machine, all three are controlled with 39 * an i2c digital to analog converter. There is a fan directed at the 40 * two processor slots, another for the rest of the enclosure, and the 41 * third is for the power supply. The first two fans may be speed 42 * controlled by changing the voltage fed to them. The third fan may 43 * only be completely off or on. The third fan is meant to only be 44 * disabled/enabled when entering/exiting the lowest power-saving 45 * mode of the machine. 46 * 47 * An environmental control kernel thread periodically monitors all 48 * temperature sensors. Based upon the samples it will adjust the 49 * fan speeds to try and keep the system within a certain temperature 50 * range (the goal being to make the fans as quiet as possible without 51 * allowing the system to get too hot). 52 * 53 * If the temperature begins to rise/fall outside of the acceptable 54 * operating range, a periodic warning will be sent to the kernel log. 55 * The fans will be put on full blast to attempt to deal with this 56 * situation. After exceeding the acceptable operating range by a 57 * certain threshold, the kernel thread will shut down the system. 58 * Here, the thread is attempting to shut the machine down cleanly 59 * before the hardware based power-off event is triggered. 60 */ 61 62/* These settings are in Celsius. We use these defaults only 63 * if we cannot interrogate the cpu-fru SEEPROM. 64 */ 65struct temp_limits { 66 s8 high_pwroff, high_shutdown, high_warn; 67 s8 low_warn, low_shutdown, low_pwroff; 68}; 69 70static struct temp_limits cpu_temp_limits[2] = { 71 { 100, 85, 80, 5, -5, -10 }, 72 { 100, 85, 80, 5, -5, -10 }, 73}; 74 75static struct temp_limits amb_temp_limits[2] = { 76 { 65, 55, 40, 5, -5, -10 }, 77 { 65, 55, 40, 5, -5, -10 }, 78}; 79 80static LIST_HEAD(all_temps); 81static LIST_HEAD(all_fans); 82 83#define CPU_FAN_REG 0xf0 84#define SYS_FAN_REG 0xf2 85#define PSUPPLY_FAN_REG 0xf4 86 87#define FAN_SPEED_MIN 0x0c 88#define FAN_SPEED_MAX 0x3f 89 90#define PSUPPLY_FAN_ON 0x1f 91#define PSUPPLY_FAN_OFF 0x00 92 93static void set_fan_speeds(struct bbc_fan_control *fp) 94{ 95 /* Put temperatures into range so we don't mis-program 96 * the hardware. 97 */ 98 if (fp->cpu_fan_speed < FAN_SPEED_MIN) 99 fp->cpu_fan_speed = FAN_SPEED_MIN; 100 if (fp->cpu_fan_speed > FAN_SPEED_MAX) 101 fp->cpu_fan_speed = FAN_SPEED_MAX; 102 if (fp->system_fan_speed < FAN_SPEED_MIN) 103 fp->system_fan_speed = FAN_SPEED_MIN; 104 if (fp->system_fan_speed > FAN_SPEED_MAX) 105 fp->system_fan_speed = FAN_SPEED_MAX; 106#ifdef ENVCTRL_TRACE 107 printk("fan%d: Changed fan speed to cpu(%02x) sys(%02x)\n", 108 fp->index, 109 fp->cpu_fan_speed, fp->system_fan_speed); 110#endif 111 112 bbc_i2c_writeb(fp->client, fp->cpu_fan_speed, CPU_FAN_REG); 113 bbc_i2c_writeb(fp->client, fp->system_fan_speed, SYS_FAN_REG); 114 bbc_i2c_writeb(fp->client, 115 (fp->psupply_fan_on ? 116 PSUPPLY_FAN_ON : PSUPPLY_FAN_OFF), 117 PSUPPLY_FAN_REG); 118} 119 120static void get_current_temps(struct bbc_cpu_temperature *tp) 121{ 122 tp->prev_amb_temp = tp->curr_amb_temp; 123 bbc_i2c_readb(tp->client, 124 (unsigned char *) &tp->curr_amb_temp, 125 MAX1617_AMB_TEMP); 126 tp->prev_cpu_temp = tp->curr_cpu_temp; 127 bbc_i2c_readb(tp->client, 128 (unsigned char *) &tp->curr_cpu_temp, 129 MAX1617_CPU_TEMP); 130#ifdef ENVCTRL_TRACE 131 printk("temp%d: cpu(%d C) amb(%d C)\n", 132 tp->index, 133 (int) tp->curr_cpu_temp, (int) tp->curr_amb_temp); 134#endif 135} 136 137 138static void do_envctrl_shutdown(struct bbc_cpu_temperature *tp) 139{ 140 static int shutting_down = 0; 141 char *type = "???"; 142 s8 val = -1; 143 144 if (shutting_down != 0) 145 return; 146 147 if (tp->curr_amb_temp >= amb_temp_limits[tp->index].high_shutdown || 148 tp->curr_amb_temp < amb_temp_limits[tp->index].low_shutdown) { 149 type = "ambient"; 150 val = tp->curr_amb_temp; 151 } else if (tp->curr_cpu_temp >= cpu_temp_limits[tp->index].high_shutdown || 152 tp->curr_cpu_temp < cpu_temp_limits[tp->index].low_shutdown) { 153 type = "CPU"; 154 val = tp->curr_cpu_temp; 155 } 156 157 printk(KERN_CRIT "temp%d: Outside of safe %s " 158 "operating temperature, %d C.\n", 159 tp->index, type, val); 160 161 printk(KERN_CRIT "kenvctrld: Shutting down the system now.\n"); 162 163 shutting_down = 1; 164 orderly_poweroff(true); 165} 166 167#define WARN_INTERVAL (30 * HZ) 168 169static void analyze_ambient_temp(struct bbc_cpu_temperature *tp, unsigned long *last_warn, int tick) 170{ 171 int ret = 0; 172 173 if (time_after(jiffies, (*last_warn + WARN_INTERVAL))) { 174 if (tp->curr_amb_temp >= 175 amb_temp_limits[tp->index].high_warn) { 176 printk(KERN_WARNING "temp%d: " 177 "Above safe ambient operating temperature, %d C.\n", 178 tp->index, (int) tp->curr_amb_temp); 179 ret = 1; 180 } else if (tp->curr_amb_temp < 181 amb_temp_limits[tp->index].low_warn) { 182 printk(KERN_WARNING "temp%d: " 183 "Below safe ambient operating temperature, %d C.\n", 184 tp->index, (int) tp->curr_amb_temp); 185 ret = 1; 186 } 187 if (ret) 188 *last_warn = jiffies; 189 } else if (tp->curr_amb_temp >= amb_temp_limits[tp->index].high_warn || 190 tp->curr_amb_temp < amb_temp_limits[tp->index].low_warn) 191 ret = 1; 192 193 /* Now check the shutdown limits. */ 194 if (tp->curr_amb_temp >= amb_temp_limits[tp->index].high_shutdown || 195 tp->curr_amb_temp < amb_temp_limits[tp->index].low_shutdown) { 196 do_envctrl_shutdown(tp); 197 ret = 1; 198 } 199 200 if (ret) { 201 tp->fan_todo[FAN_AMBIENT] = FAN_FULLBLAST; 202 } else if ((tick & (8 - 1)) == 0) { 203 s8 amb_goal_hi = amb_temp_limits[tp->index].high_warn - 10; 204 s8 amb_goal_lo; 205 206 amb_goal_lo = amb_goal_hi - 3; 207 208 /* We do not try to avoid 'too cold' events. Basically we 209 * only try to deal with over-heating and fan noise reduction. 210 */ 211 if (tp->avg_amb_temp < amb_goal_hi) { 212 if (tp->avg_amb_temp >= amb_goal_lo) 213 tp->fan_todo[FAN_AMBIENT] = FAN_SAME; 214 else 215 tp->fan_todo[FAN_AMBIENT] = FAN_SLOWER; 216 } else { 217 tp->fan_todo[FAN_AMBIENT] = FAN_FASTER; 218 } 219 } else { 220 tp->fan_todo[FAN_AMBIENT] = FAN_SAME; 221 } 222} 223 224static void analyze_cpu_temp(struct bbc_cpu_temperature *tp, unsigned long *last_warn, int tick) 225{ 226 int ret = 0; 227 228 if (time_after(jiffies, (*last_warn + WARN_INTERVAL))) { 229 if (tp->curr_cpu_temp >= 230 cpu_temp_limits[tp->index].high_warn) { 231 printk(KERN_WARNING "temp%d: " 232 "Above safe CPU operating temperature, %d C.\n", 233 tp->index, (int) tp->curr_cpu_temp); 234 ret = 1; 235 } else if (tp->curr_cpu_temp < 236 cpu_temp_limits[tp->index].low_warn) { 237 printk(KERN_WARNING "temp%d: " 238 "Below safe CPU operating temperature, %d C.\n", 239 tp->index, (int) tp->curr_cpu_temp); 240 ret = 1; 241 } 242 if (ret) 243 *last_warn = jiffies; 244 } else if (tp->curr_cpu_temp >= cpu_temp_limits[tp->index].high_warn || 245 tp->curr_cpu_temp < cpu_temp_limits[tp->index].low_warn) 246 ret = 1; 247 248 /* Now check the shutdown limits. */ 249 if (tp->curr_cpu_temp >= cpu_temp_limits[tp->index].high_shutdown || 250 tp->curr_cpu_temp < cpu_temp_limits[tp->index].low_shutdown) { 251 do_envctrl_shutdown(tp); 252 ret = 1; 253 } 254 255 if (ret) { 256 tp->fan_todo[FAN_CPU] = FAN_FULLBLAST; 257 } else if ((tick & (8 - 1)) == 0) { 258 s8 cpu_goal_hi = cpu_temp_limits[tp->index].high_warn - 10; 259 s8 cpu_goal_lo; 260 261 cpu_goal_lo = cpu_goal_hi - 3; 262 263 /* We do not try to avoid 'too cold' events. Basically we 264 * only try to deal with over-heating and fan noise reduction. 265 */ 266 if (tp->avg_cpu_temp < cpu_goal_hi) { 267 if (tp->avg_cpu_temp >= cpu_goal_lo) 268 tp->fan_todo[FAN_CPU] = FAN_SAME; 269 else 270 tp->fan_todo[FAN_CPU] = FAN_SLOWER; 271 } else { 272 tp->fan_todo[FAN_CPU] = FAN_FASTER; 273 } 274 } else { 275 tp->fan_todo[FAN_CPU] = FAN_SAME; 276 } 277} 278 279static void analyze_temps(struct bbc_cpu_temperature *tp, unsigned long *last_warn) 280{ 281 tp->avg_amb_temp = (s8)((int)((int)tp->avg_amb_temp + (int)tp->curr_amb_temp) / 2); 282 tp->avg_cpu_temp = (s8)((int)((int)tp->avg_cpu_temp + (int)tp->curr_cpu_temp) / 2); 283 284 analyze_ambient_temp(tp, last_warn, tp->sample_tick); 285 analyze_cpu_temp(tp, last_warn, tp->sample_tick); 286 287 tp->sample_tick++; 288} 289 290static enum fan_action prioritize_fan_action(int which_fan) 291{ 292 struct bbc_cpu_temperature *tp; 293 enum fan_action decision = FAN_STATE_MAX; 294 295 /* Basically, prioritize what the temperature sensors 296 * recommend we do, and perform that action on all the 297 * fans. 298 */ 299 list_for_each_entry(tp, &all_temps, glob_list) { 300 if (tp->fan_todo[which_fan] == FAN_FULLBLAST) { 301 decision = FAN_FULLBLAST; 302 break; 303 } 304 if (tp->fan_todo[which_fan] == FAN_SAME && 305 decision != FAN_FASTER) 306 decision = FAN_SAME; 307 else if (tp->fan_todo[which_fan] == FAN_FASTER) 308 decision = FAN_FASTER; 309 else if (decision != FAN_FASTER && 310 decision != FAN_SAME && 311 tp->fan_todo[which_fan] == FAN_SLOWER) 312 decision = FAN_SLOWER; 313 } 314 if (decision == FAN_STATE_MAX) 315 decision = FAN_SAME; 316 317 return decision; 318} 319 320static int maybe_new_ambient_fan_speed(struct bbc_fan_control *fp) 321{ 322 enum fan_action decision = prioritize_fan_action(FAN_AMBIENT); 323 int ret; 324 325 if (decision == FAN_SAME) 326 return 0; 327 328 ret = 1; 329 if (decision == FAN_FULLBLAST) { 330 if (fp->system_fan_speed >= FAN_SPEED_MAX) 331 ret = 0; 332 else 333 fp->system_fan_speed = FAN_SPEED_MAX; 334 } else { 335 if (decision == FAN_FASTER) { 336 if (fp->system_fan_speed >= FAN_SPEED_MAX) 337 ret = 0; 338 else 339 fp->system_fan_speed += 2; 340 } else { 341 int orig_speed = fp->system_fan_speed; 342 343 if (orig_speed <= FAN_SPEED_MIN || 344 orig_speed <= (fp->cpu_fan_speed - 3)) 345 ret = 0; 346 else 347 fp->system_fan_speed -= 1; 348 } 349 } 350 351 return ret; 352} 353 354static int maybe_new_cpu_fan_speed(struct bbc_fan_control *fp) 355{ 356 enum fan_action decision = prioritize_fan_action(FAN_CPU); 357 int ret; 358 359 if (decision == FAN_SAME) 360 return 0; 361 362 ret = 1; 363 if (decision == FAN_FULLBLAST) { 364 if (fp->cpu_fan_speed >= FAN_SPEED_MAX) 365 ret = 0; 366 else 367 fp->cpu_fan_speed = FAN_SPEED_MAX; 368 } else { 369 if (decision == FAN_FASTER) { 370 if (fp->cpu_fan_speed >= FAN_SPEED_MAX) 371 ret = 0; 372 else { 373 fp->cpu_fan_speed += 2; 374 if (fp->system_fan_speed < 375 (fp->cpu_fan_speed - 3)) 376 fp->system_fan_speed = 377 fp->cpu_fan_speed - 3; 378 } 379 } else { 380 if (fp->cpu_fan_speed <= FAN_SPEED_MIN) 381 ret = 0; 382 else 383 fp->cpu_fan_speed -= 1; 384 } 385 } 386 387 return ret; 388} 389 390static void maybe_new_fan_speeds(struct bbc_fan_control *fp) 391{ 392 int new; 393 394 new = maybe_new_ambient_fan_speed(fp); 395 new |= maybe_new_cpu_fan_speed(fp); 396 397 if (new) 398 set_fan_speeds(fp); 399} 400 401static void fans_full_blast(void) 402{ 403 struct bbc_fan_control *fp; 404 405 /* Since we will not be monitoring things anymore, put 406 * the fans on full blast. 407 */ 408 list_for_each_entry(fp, &all_fans, glob_list) { 409 fp->cpu_fan_speed = FAN_SPEED_MAX; 410 fp->system_fan_speed = FAN_SPEED_MAX; 411 fp->psupply_fan_on = 1; 412 set_fan_speeds(fp); 413 } 414} 415 416#define POLL_INTERVAL (5 * 1000) 417static unsigned long last_warning_jiffies; 418static struct task_struct *kenvctrld_task; 419 420static int kenvctrld(void *__unused) 421{ 422 printk(KERN_INFO "bbc_envctrl: kenvctrld starting...\n"); 423 last_warning_jiffies = jiffies - WARN_INTERVAL; 424 for (;;) { 425 struct bbc_cpu_temperature *tp; 426 struct bbc_fan_control *fp; 427 428 msleep_interruptible(POLL_INTERVAL); 429 if (kthread_should_stop()) 430 break; 431 432 list_for_each_entry(tp, &all_temps, glob_list) { 433 get_current_temps(tp); 434 analyze_temps(tp, &last_warning_jiffies); 435 } 436 list_for_each_entry(fp, &all_fans, glob_list) 437 maybe_new_fan_speeds(fp); 438 } 439 printk(KERN_INFO "bbc_envctrl: kenvctrld exiting...\n"); 440 441 fans_full_blast(); 442 443 return 0; 444} 445 446static void attach_one_temp(struct bbc_i2c_bus *bp, struct platform_device *op, 447 int temp_idx) 448{ 449 struct bbc_cpu_temperature *tp; 450 451 tp = kzalloc(sizeof(*tp), GFP_KERNEL); 452 if (!tp) 453 return; 454 455 INIT_LIST_HEAD(&tp->bp_list); 456 INIT_LIST_HEAD(&tp->glob_list); 457 458 tp->client = bbc_i2c_attach(bp, op); 459 if (!tp->client) { 460 kfree(tp); 461 return; 462 } 463 464 465 tp->index = temp_idx; 466 467 list_add(&tp->glob_list, &all_temps); 468 list_add(&tp->bp_list, &bp->temps); 469 470 /* Tell it to convert once every 5 seconds, clear all cfg 471 * bits. 472 */ 473 bbc_i2c_writeb(tp->client, 0x00, MAX1617_WR_CFG_BYTE); 474 bbc_i2c_writeb(tp->client, 0x02, MAX1617_WR_CVRATE_BYTE); 475 476 /* Program the hard temperature limits into the chip. */ 477 bbc_i2c_writeb(tp->client, amb_temp_limits[tp->index].high_pwroff, 478 MAX1617_WR_AMB_HIGHLIM); 479 bbc_i2c_writeb(tp->client, amb_temp_limits[tp->index].low_pwroff, 480 MAX1617_WR_AMB_LOWLIM); 481 bbc_i2c_writeb(tp->client, cpu_temp_limits[tp->index].high_pwroff, 482 MAX1617_WR_CPU_HIGHLIM); 483 bbc_i2c_writeb(tp->client, cpu_temp_limits[tp->index].low_pwroff, 484 MAX1617_WR_CPU_LOWLIM); 485 486 get_current_temps(tp); 487 tp->prev_cpu_temp = tp->avg_cpu_temp = tp->curr_cpu_temp; 488 tp->prev_amb_temp = tp->avg_amb_temp = tp->curr_amb_temp; 489 490 tp->fan_todo[FAN_AMBIENT] = FAN_SAME; 491 tp->fan_todo[FAN_CPU] = FAN_SAME; 492} 493 494static void attach_one_fan(struct bbc_i2c_bus *bp, struct platform_device *op, 495 int fan_idx) 496{ 497 struct bbc_fan_control *fp; 498 499 fp = kzalloc(sizeof(*fp), GFP_KERNEL); 500 if (!fp) 501 return; 502 503 INIT_LIST_HEAD(&fp->bp_list); 504 INIT_LIST_HEAD(&fp->glob_list); 505 506 fp->client = bbc_i2c_attach(bp, op); 507 if (!fp->client) { 508 kfree(fp); 509 return; 510 } 511 512 fp->index = fan_idx; 513 514 list_add(&fp->glob_list, &all_fans); 515 list_add(&fp->bp_list, &bp->fans); 516 517 /* The i2c device controlling the fans is write-only. 518 * So the only way to keep track of the current power 519 * level fed to the fans is via software. Choose half 520 * power for cpu/system and 'on' fo the powersupply fan 521 * and set it now. 522 */ 523 fp->psupply_fan_on = 1; 524 fp->cpu_fan_speed = (FAN_SPEED_MAX - FAN_SPEED_MIN) / 2; 525 fp->cpu_fan_speed += FAN_SPEED_MIN; 526 fp->system_fan_speed = (FAN_SPEED_MAX - FAN_SPEED_MIN) / 2; 527 fp->system_fan_speed += FAN_SPEED_MIN; 528 529 set_fan_speeds(fp); 530} 531 532static void destroy_one_temp(struct bbc_cpu_temperature *tp) 533{ 534 bbc_i2c_detach(tp->client); 535 kfree(tp); 536} 537 538static void destroy_all_temps(struct bbc_i2c_bus *bp) 539{ 540 struct bbc_cpu_temperature *tp, *tpos; 541 542 list_for_each_entry_safe(tp, tpos, &bp->temps, bp_list) { 543 list_del(&tp->bp_list); 544 list_del(&tp->glob_list); 545 destroy_one_temp(tp); 546 } 547} 548 549static void destroy_one_fan(struct bbc_fan_control *fp) 550{ 551 bbc_i2c_detach(fp->client); 552 kfree(fp); 553} 554 555static void destroy_all_fans(struct bbc_i2c_bus *bp) 556{ 557 struct bbc_fan_control *fp, *fpos; 558 559 list_for_each_entry_safe(fp, fpos, &bp->fans, bp_list) { 560 list_del(&fp->bp_list); 561 list_del(&fp->glob_list); 562 destroy_one_fan(fp); 563 } 564} 565 566int bbc_envctrl_init(struct bbc_i2c_bus *bp) 567{ 568 struct platform_device *op; 569 int temp_index = 0; 570 int fan_index = 0; 571 int devidx = 0; 572 573 while ((op = bbc_i2c_getdev(bp, devidx++)) != NULL) { 574 if (of_node_name_eq(op->dev.of_node, "temperature")) 575 attach_one_temp(bp, op, temp_index++); 576 if (of_node_name_eq(op->dev.of_node, "fan-control")) 577 attach_one_fan(bp, op, fan_index++); 578 } 579 if (temp_index != 0 && fan_index != 0) { 580 kenvctrld_task = kthread_run(kenvctrld, NULL, "kenvctrld"); 581 if (IS_ERR(kenvctrld_task)) { 582 int err = PTR_ERR(kenvctrld_task); 583 584 kenvctrld_task = NULL; 585 destroy_all_temps(bp); 586 destroy_all_fans(bp); 587 return err; 588 } 589 } 590 591 return 0; 592} 593 594void bbc_envctrl_cleanup(struct bbc_i2c_bus *bp) 595{ 596 if (kenvctrld_task) 597 kthread_stop(kenvctrld_task); 598 599 destroy_all_temps(bp); 600 destroy_all_fans(bp); 601}