1 /** 2 * Copyright 2017 Google Inc. 3 * 4 * Licensed under the Apache License, Version 2.0 (the "License"); 5 * you may not use this file except in compliance with the License. 6 * You may obtain a copy of the License at 7 * 8 * http://www.apache.org/licenses/LICENSE-2.0 9 * 10 * Unless required by applicable law or agreed to in writing, software 11 * distributed under the License is distributed on an "AS IS" BASIS, 12 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 13 * See the License for the specific language governing permissions and 14 * limitations under the License. 15 */ 16 17 /* Configuration. */ 18 #include "zone.hpp" 19 20 #include "conf.hpp" 21 #include "failsafeloggers/failsafe_logger_utility.hpp" 22 #include "pid/controller.hpp" 23 #include "pid/ec/pid.hpp" 24 #include "pid/fancontroller.hpp" 25 #include "pid/stepwisecontroller.hpp" 26 #include "pid/thermalcontroller.hpp" 27 #include "pid/tuning.hpp" 28 29 #include <algorithm> 30 #include <chrono> 31 #include <cstring> 32 #include <fstream> 33 #include <iostream> 34 #include <memory> 35 #include <sstream> 36 #include <string> 37 38 using tstamp = std::chrono::high_resolution_clock::time_point; 39 using namespace std::literals::chrono_literals; 40 41 // Enforces minimum duration between events 42 // Rreturns true if event should be allowed, false if disallowed 43 bool allowThrottle(const tstamp& now, const std::chrono::seconds& pace) 44 { 45 static tstamp then; 46 static bool first = true; 47 48 if (first) 49 { 50 // Special case initialization 51 then = now; 52 first = false; 53 54 // Initialization, always allow 55 return true; 56 } 57 58 auto elapsed = now - then; 59 if (elapsed < pace) 60 { 61 // Too soon since last time, disallow 62 return false; 63 } 64 65 // It has been long enough, allow 66 then = now; 67 return true; 68 } 69 70 namespace pid_control 71 { 72 73 double DbusPidZone::getMaxSetPointRequest(void) const 74 { 75 return _maximumSetPoint; 76 } 77 78 bool DbusPidZone::getManualMode(void) const 79 { 80 return _manualMode; 81 } 82 83 void DbusPidZone::setManualMode(bool mode) 84 { 85 _manualMode = mode; 86 87 // If returning to automatic mode, need to restore PWM from PID loop 88 if (!mode) 89 { 90 _redundantWrite = true; 91 } 92 } 93 94 bool DbusPidZone::getFailSafeMode(void) const 95 { 96 // If any keys are present at least one sensor is in fail safe mode. 97 return !_failSafeSensors.empty(); 98 } 99 100 FailSafeSensorsMap DbusPidZone::getFailSafeSensors(void) const 101 { 102 return _failSafeSensors; 103 } 104 105 void DbusPidZone::markSensorMissing(const std::string& name, 106 const std::string& failReason) 107 { 108 if (_missingAcceptable.find(name) != _missingAcceptable.end()) 109 { 110 // Disallow sensors in MissingIsAcceptable list from causing failsafe 111 outputFailsafeLogWithZone(_zoneId, this->getFailSafeMode(), name, 112 "The sensor is missing but is acceptable."); 113 return; 114 } 115 116 if (_sensorFailSafePercent[name] == 0) 117 { 118 _failSafeSensors[name] = std::pair(failReason, _zoneFailSafePercent); 119 } 120 else 121 { 122 _failSafeSensors[name] = 123 std::pair(failReason, _sensorFailSafePercent[name]); 124 } 125 126 if (debugEnabled) 127 { 128 std::cerr << "Sensor " << name << " marked missing\n"; 129 } 130 } 131 132 int64_t DbusPidZone::getZoneID(void) const 133 { 134 return _zoneId; 135 } 136 137 void DbusPidZone::addSetPoint(double setPoint, const std::string& name) 138 { 139 /* exclude disabled pidloop from _maximumSetPoint calculation*/ 140 if (!isPidProcessEnabled(name)) 141 { 142 return; 143 } 144 145 auto profileName = name; 146 if (getAccSetPoint()) 147 { 148 /* 149 * If the name of controller is Linear_Temp_CPU0. 150 * The profile name will be Temp_CPU0. 151 */ 152 profileName = name.substr(name.find("_") + 1); 153 _SetPoints[profileName] += setPoint; 154 } 155 else 156 { 157 if (_SetPoints[profileName] < setPoint) 158 { 159 _SetPoints[profileName] = setPoint; 160 } 161 } 162 163 /* 164 * if there are multiple thermal controllers with the same 165 * value, pick the first one in the iterator 166 */ 167 if (_maximumSetPoint < _SetPoints[profileName]) 168 { 169 _maximumSetPoint = _SetPoints[profileName]; 170 _maximumSetPointName = profileName; 171 } 172 } 173 174 void DbusPidZone::addRPMCeiling(double ceiling) 175 { 176 _RPMCeilings.push_back(ceiling); 177 } 178 179 void DbusPidZone::clearRPMCeilings(void) 180 { 181 _RPMCeilings.clear(); 182 } 183 184 void DbusPidZone::clearSetPoints(void) 185 { 186 _SetPoints.clear(); 187 _maximumSetPoint = 0; 188 _maximumSetPointName.clear(); 189 } 190 191 double DbusPidZone::getFailSafePercent(void) 192 { 193 if (_failSafeSensors.empty()) 194 { 195 return _zoneFailSafePercent; 196 } 197 198 FailSafeSensorsMap::iterator maxData = std::max_element( 199 _failSafeSensors.begin(), _failSafeSensors.end(), 200 [](const FailSafeSensorPair firstData, 201 const FailSafeSensorPair secondData) { 202 return firstData.second.second < secondData.second.second; 203 }); 204 205 // In dbus/dbusconfiguration.cpp, the default sensor failsafepercent is 0 if 206 // there is no setting in json. 207 // Therfore, if the max failsafe duty in _failSafeSensors is 0, set final 208 // failsafe duty to _zoneFailSafePercent. 209 if ((*maxData).second.second == 0) 210 { 211 return _zoneFailSafePercent; 212 } 213 else 214 { 215 return (*maxData).second.second; 216 } 217 } 218 219 double DbusPidZone::getMinThermalSetPoint(void) const 220 { 221 return _minThermalOutputSetPt; 222 } 223 224 uint64_t DbusPidZone::getCycleIntervalTime(void) const 225 { 226 return _cycleTime.cycleIntervalTimeMS; 227 } 228 229 uint64_t DbusPidZone::getUpdateThermalsCycle(void) const 230 { 231 return _cycleTime.updateThermalsTimeMS; 232 } 233 234 void DbusPidZone::addFanPID(std::unique_ptr<Controller> pid) 235 { 236 _fans.push_back(std::move(pid)); 237 } 238 239 void DbusPidZone::addThermalPID(std::unique_ptr<Controller> pid) 240 { 241 _thermals.push_back(std::move(pid)); 242 } 243 244 double DbusPidZone::getCachedValue(const std::string& name) 245 { 246 return _cachedValuesByName.at(name).scaled; 247 } 248 249 ValueCacheEntry DbusPidZone::getCachedValues(const std::string& name) 250 { 251 return _cachedValuesByName.at(name); 252 } 253 254 void DbusPidZone::setOutputCache(std::string_view name, 255 const ValueCacheEntry& values) 256 { 257 _cachedFanOutputs[std::string{name}] = values; 258 } 259 260 void DbusPidZone::addFanInput(const std::string& fan, bool missingAcceptable) 261 { 262 _fanInputs.push_back(fan); 263 264 if (missingAcceptable) 265 { 266 _missingAcceptable.emplace(fan); 267 } 268 } 269 270 void DbusPidZone::addThermalInput(const std::string& therm, 271 bool missingAcceptable) 272 { 273 /* 274 * One sensor may have stepwise and PID at the same time. 275 * Searching the sensor name before inserting it to avoid duplicated sensor 276 * names. 277 */ 278 if (std::find(_thermalInputs.begin(), _thermalInputs.end(), therm) == 279 _thermalInputs.end()) 280 { 281 _thermalInputs.push_back(therm); 282 } 283 284 if (missingAcceptable) 285 { 286 _missingAcceptable.emplace(therm); 287 } 288 } 289 290 // Updates desired RPM setpoint from optional text file 291 // Returns true if rpmValue updated, false if left unchanged 292 static bool fileParseRpm(const std::string& fileName, double& rpmValue) 293 { 294 static constexpr std::chrono::seconds throttlePace{3}; 295 296 std::string errText; 297 298 try 299 { 300 std::ifstream ifs; 301 ifs.open(fileName); 302 if (ifs) 303 { 304 int value; 305 ifs >> value; 306 307 if (value <= 0) 308 { 309 errText = "File content could not be parsed to a number"; 310 } 311 else if (value <= 100) 312 { 313 errText = "File must contain RPM value, not PWM value"; 314 } 315 else 316 { 317 rpmValue = static_cast<double>(value); 318 return true; 319 } 320 } 321 } 322 catch (const std::exception& e) 323 { 324 errText = "Exception: "; 325 errText += e.what(); 326 } 327 328 // The file is optional, intentionally not an error if file not found 329 if (!(errText.empty())) 330 { 331 tstamp now = std::chrono::high_resolution_clock::now(); 332 if (allowThrottle(now, throttlePace)) 333 { 334 std::cerr << "Unable to read from '" << fileName << "': " << errText 335 << "\n"; 336 } 337 } 338 339 return false; 340 } 341 342 void DbusPidZone::determineMaxSetPointRequest(void) 343 { 344 std::vector<double>::iterator result; 345 double minThermalThreshold = getMinThermalSetPoint(); 346 347 if (_RPMCeilings.size() > 0) 348 { 349 result = std::min_element(_RPMCeilings.begin(), _RPMCeilings.end()); 350 // if Max set point is larger than the lowest ceiling, reset to lowest 351 // ceiling. 352 if (*result < _maximumSetPoint) 353 { 354 _maximumSetPoint = *result; 355 // When using lowest ceiling, controller name is ceiling. 356 _maximumSetPointName = "Ceiling"; 357 } 358 } 359 360 /* 361 * Combine the maximum SetPoint Name if the controllers have same profile 362 * name. e.g., PID_BB_INLET_TEMP_C + Stepwise_BB_INLET_TEMP_C. 363 */ 364 if (getAccSetPoint()) 365 { 366 auto profileName = _maximumSetPointName; 367 _maximumSetPointName = ""; 368 369 for (auto& p : _thermals) 370 { 371 auto controllerID = p->getID(); 372 auto found = controllerID.find(profileName); 373 if (found != std::string::npos) 374 { 375 if (_maximumSetPointName.empty()) 376 { 377 _maximumSetPointName = controllerID; 378 } 379 else 380 { 381 _maximumSetPointName += " + " + controllerID; 382 } 383 } 384 } 385 } 386 387 /* 388 * If the maximum RPM setpoint output is below the minimum RPM 389 * setpoint, set it to the minimum. 390 */ 391 if (minThermalThreshold >= _maximumSetPoint) 392 { 393 _maximumSetPoint = minThermalThreshold; 394 _maximumSetPointName = "Minimum"; 395 } 396 else if (_maximumSetPointName.compare(_maximumSetPointNamePrev)) 397 { 398 std::cerr << "PID Zone " << _zoneId << " max SetPoint " 399 << _maximumSetPoint << " requested by " 400 << _maximumSetPointName; 401 for (const auto& sensor : _failSafeSensors) 402 { 403 if (sensor.first.find("Fan") == std::string::npos) 404 { 405 std::cerr << " " << sensor.first; 406 } 407 } 408 std::cerr << "\n"; 409 _maximumSetPointNamePrev.assign(_maximumSetPointName); 410 } 411 if (tuningEnabled) 412 { 413 /* 414 * We received no setpoints from thermal sensors. 415 * This is a case experienced during tuning where they only specify 416 * fan sensors and one large fan PID for all the fans. 417 */ 418 static constexpr auto setpointpath = "/etc/thermal.d/setpoint"; 419 420 fileParseRpm(setpointpath, _maximumSetPoint); 421 422 // Allow per-zone setpoint files to override overall setpoint file 423 std::ostringstream zoneSuffix; 424 zoneSuffix << ".zone" << _zoneId; 425 std::string zoneSetpointPath = setpointpath + zoneSuffix.str(); 426 427 fileParseRpm(zoneSetpointPath, _maximumSetPoint); 428 } 429 return; 430 } 431 432 void DbusPidZone::initializeLog(void) 433 { 434 /* Print header for log file: 435 * epoch_ms,setpt,fan1,fan1_raw,fan1_pwm,fan1_pwm_raw,fan2,fan2_raw,fan2_pwm,fan2_pwm_raw,fanN,fanN_raw,fanN_pwm,fanN_pwm_raw,sensor1,sensor1_raw,sensor2,sensor2_raw,sensorN,sensorN_raw,failsafe 436 */ 437 438 _log << "epoch_ms,setpt,requester"; 439 440 for (const auto& f : _fanInputs) 441 { 442 _log << "," << f << "," << f << "_raw"; 443 _log << "," << f << "_pwm," << f << "_pwm_raw"; 444 } 445 for (const auto& t : _thermalInputs) 446 { 447 _log << "," << t << "," << t << "_raw"; 448 } 449 450 _log << ",failsafe"; 451 _log << std::endl; 452 } 453 454 void DbusPidZone::writeLog(const std::string& value) 455 { 456 _log << value; 457 } 458 459 /* 460 * TODO(venture) This is effectively updating the cache and should check if the 461 * values they're using to update it are new or old, or whatnot. For instance, 462 * if we haven't heard from the host in X time we need to detect this failure. 463 * 464 * I haven't decided if the Sensor should have a lastUpdated method or whether 465 * that should be for the ReadInterface or etc... 466 */ 467 468 /** 469 * We want the PID loop to run with values cached, so this will get all the 470 * fan tachs for the loop. 471 */ 472 void DbusPidZone::updateFanTelemetry(void) 473 { 474 /* TODO(venture): Should I just make _log point to /dev/null when logging 475 * is disabled? I think it's a waste to try and log things even if the 476 * data is just being dropped though. 477 */ 478 const auto now = std::chrono::high_resolution_clock::now(); 479 if (loggingEnabled) 480 { 481 _log << std::chrono::duration_cast<std::chrono::milliseconds>( 482 now.time_since_epoch()) 483 .count(); 484 _log << "," << _maximumSetPoint; 485 _log << "," << _maximumSetPointName; 486 } 487 488 processSensorInputs</* fanSensorLogging */ true>(_fanInputs, now); 489 490 if (loggingEnabled) 491 { 492 for (const auto& t : _thermalInputs) 493 { 494 const auto& v = _cachedValuesByName[t]; 495 _log << "," << v.scaled << "," << v.unscaled; 496 } 497 } 498 499 return; 500 } 501 502 void DbusPidZone::updateSensors(void) 503 { 504 processSensorInputs</* fanSensorLogging */ false>( 505 _thermalInputs, std::chrono::high_resolution_clock::now()); 506 507 return; 508 } 509 510 void DbusPidZone::initializeCache(void) 511 { 512 auto nan = std::numeric_limits<double>::quiet_NaN(); 513 514 for (const auto& f : _fanInputs) 515 { 516 _cachedValuesByName[f] = {nan, nan}; 517 _cachedFanOutputs[f] = {nan, nan}; 518 519 // Start all fans in fail-safe mode. 520 markSensorMissing(f, ""); 521 } 522 523 for (const auto& t : _thermalInputs) 524 { 525 _cachedValuesByName[t] = {nan, nan}; 526 527 // Start all sensors in fail-safe mode. 528 markSensorMissing(t, ""); 529 } 530 } 531 532 void DbusPidZone::dumpCache(void) 533 { 534 std::cerr << "Cache values now: \n"; 535 for (const auto& [name, value] : _cachedValuesByName) 536 { 537 std::cerr << name << ": " << value.scaled << " " << value.unscaled 538 << "\n"; 539 } 540 541 std::cerr << "Fan outputs now: \n"; 542 for (const auto& [name, value] : _cachedFanOutputs) 543 { 544 std::cerr << name << ": " << value.scaled << " " << value.unscaled 545 << "\n"; 546 } 547 } 548 549 void DbusPidZone::processFans(void) 550 { 551 for (auto& p : _fans) 552 { 553 p->process(); 554 } 555 556 if (_redundantWrite) 557 { 558 // This is only needed once 559 _redundantWrite = false; 560 } 561 } 562 563 void DbusPidZone::processThermals(void) 564 { 565 for (auto& p : _thermals) 566 { 567 p->process(); 568 } 569 } 570 571 Sensor* DbusPidZone::getSensor(const std::string& name) 572 { 573 return _mgr.getSensor(name); 574 } 575 576 std::vector<std::string> DbusPidZone::getSensorNames(void) 577 { 578 return _thermalInputs; 579 } 580 581 bool DbusPidZone::getRedundantWrite(void) const 582 { 583 return _redundantWrite; 584 } 585 586 bool DbusPidZone::manual(bool value) 587 { 588 std::cerr << "manual: " << value << std::endl; 589 setManualMode(value); 590 return ModeObject::manual(value); 591 } 592 593 bool DbusPidZone::failSafe() const 594 { 595 return getFailSafeMode(); 596 } 597 598 void DbusPidZone::addPidControlProcess(std::string name, std::string type, 599 double setpoint, sdbusplus::bus_t& bus, 600 std::string objPath, bool defer) 601 { 602 _pidsControlProcess[name] = std::make_unique<ProcessObject>( 603 bus, objPath.c_str(), 604 defer ? ProcessObject::action::defer_emit 605 : ProcessObject::action::emit_object_added); 606 // Default enable setting = true 607 _pidsControlProcess[name]->enabled(true); 608 _pidsControlProcess[name]->setpoint(setpoint); 609 610 if (type == "temp") 611 { 612 _pidsControlProcess[name]->classType("Temperature"); 613 } 614 else if (type == "margin") 615 { 616 _pidsControlProcess[name]->classType("Margin"); 617 } 618 else if (type == "power") 619 { 620 _pidsControlProcess[name]->classType("Power"); 621 } 622 else if (type == "powersum") 623 { 624 _pidsControlProcess[name]->classType("PowerSum"); 625 } 626 } 627 628 bool DbusPidZone::isPidProcessEnabled(std::string name) 629 { 630 return _pidsControlProcess[name]->enabled(); 631 } 632 633 void DbusPidZone::addPidFailSafePercent(std::vector<std::string> inputs, 634 double percent) 635 { 636 for (const auto& sensorName : inputs) 637 { 638 if (_sensorFailSafePercent.find(sensorName) != 639 _sensorFailSafePercent.end()) 640 { 641 _sensorFailSafePercent[sensorName] = 642 std::max(_sensorFailSafePercent[sensorName], percent); 643 if (debugEnabled) 644 { 645 std::cerr << "Sensor " << sensorName 646 << " failsafe percent updated to " 647 << _sensorFailSafePercent[sensorName] << "\n"; 648 } 649 } 650 else 651 { 652 _sensorFailSafePercent[sensorName] = percent; 653 if (debugEnabled) 654 { 655 std::cerr << "Sensor " << sensorName 656 << " failsafe percent set to " << percent << "\n"; 657 } 658 } 659 } 660 } 661 662 std::string DbusPidZone::leader() const 663 { 664 return _maximumSetPointName; 665 } 666 667 void DbusPidZone::updateThermalPowerDebugInterface( 668 std::string pidName, std::string leader, double input, double output) 669 { 670 if (leader.empty()) 671 { 672 _pidsControlProcess[pidName]->output(output); 673 } 674 else 675 { 676 _pidsControlProcess[pidName]->leader(leader); 677 _pidsControlProcess[pidName]->input(input); 678 } 679 } 680 681 bool DbusPidZone::getAccSetPoint(void) const 682 { 683 return _accumulateSetPoint; 684 } 685 686 } // namespace pid_control 687