1 /** 2 * Copyright 2017 Google Inc. 3 * 4 * Licensed under the Apache License, Version 2.0 (the "License"); 5 * you may not use this file except in compliance with the License. 6 * You may obtain a copy of the License at 7 * 8 * http://www.apache.org/licenses/LICENSE-2.0 9 * 10 * Unless required by applicable law or agreed to in writing, software 11 * distributed under the License is distributed on an "AS IS" BASIS, 12 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 13 * See the License for the specific language governing permissions and 14 * limitations under the License. 15 */ 16 #include "dbuspassive.hpp" 17 18 #include "dbushelper_interface.hpp" 19 #include "dbuspassiveredundancy.hpp" 20 #include "dbusutil.hpp" 21 #include "util.hpp" 22 23 #include <sdbusplus/bus.hpp> 24 25 #include <chrono> 26 #include <cmath> 27 #include <memory> 28 #include <mutex> 29 #include <string> 30 #include <variant> 31 32 namespace pid_control 33 { 34 35 std::unique_ptr<ReadInterface> DbusPassive::createDbusPassive( 36 sdbusplus::bus_t& bus, const std::string& type, const std::string& id, 37 std::unique_ptr<DbusHelperInterface> helper, const conf::SensorConfig* info, 38 const std::shared_ptr<DbusPassiveRedundancy>& redundancy) 39 { 40 if (helper == nullptr) 41 { 42 return nullptr; 43 } 44 if (!validType(type)) 45 { 46 return nullptr; 47 } 48 49 /* Need to get the scale and initial value */ 50 /* service == busname */ 51 std::string path; 52 if (info->readPath.empty()) 53 { 54 path = getSensorPath(type, id); 55 } 56 else 57 { 58 path = info->readPath; 59 } 60 61 SensorProperties settings; 62 bool failed; 63 64 try 65 { 66 std::string service = helper->getService(sensorintf, path); 67 68 helper->getProperties(service, path, &settings); 69 failed = helper->thresholdsAsserted(service, path); 70 } 71 catch (const std::exception& e) 72 { 73 return nullptr; 74 } 75 76 /* if these values are zero, they're ignored. */ 77 if (info->ignoreDbusMinMax) 78 { 79 settings.min = 0; 80 settings.max = 0; 81 } 82 83 settings.unavailableAsFailed = info->unavailableAsFailed; 84 85 return std::make_unique<DbusPassive>(bus, type, id, std::move(helper), 86 settings, failed, path, redundancy); 87 } 88 89 DbusPassive::DbusPassive( 90 sdbusplus::bus_t& bus, const std::string& type, const std::string& id, 91 std::unique_ptr<DbusHelperInterface> helper, 92 const SensorProperties& settings, bool failed, const std::string& path, 93 const std::shared_ptr<DbusPassiveRedundancy>& redundancy) : 94 ReadInterface(), 95 _signal(bus, getMatch(path).c_str(), dbusHandleSignal, this), _id(id), 96 _helper(std::move(helper)), _failed(failed), path(path), 97 redundancy(redundancy) 98 99 { 100 _scale = settings.scale; 101 _min = settings.min * std::pow(10.0, _scale); 102 _max = settings.max * std::pow(10.0, _scale); 103 _available = settings.available; 104 _unavailableAsFailed = settings.unavailableAsFailed; 105 106 // Cache this type knowledge, to avoid repeated string comparison 107 _typeMargin = (type == "margin"); 108 _typeFan = (type == "fan"); 109 110 // Force value to be stored, otherwise member would be uninitialized 111 updateValue(settings.value, true); 112 } 113 114 ReadReturn DbusPassive::read(void) 115 { 116 std::lock_guard<std::mutex> guard(_lock); 117 118 ReadReturn r = {_value, _updated, _unscaled}; 119 120 return r; 121 } 122 123 void DbusPassive::setValue(double value, double unscaled) 124 { 125 std::lock_guard<std::mutex> guard(_lock); 126 127 _value = value; 128 _unscaled = unscaled; 129 _updated = std::chrono::high_resolution_clock::now(); 130 } 131 132 void DbusPassive::setValue(double value) 133 { 134 // First param is scaled, second param is unscaled, assume same here 135 setValue(value, value); 136 } 137 138 bool DbusPassive::getFailed(void) const 139 { 140 if (redundancy) 141 { 142 const std::set<std::string>& failures = redundancy->getFailed(); 143 if (failures.find(path) != failures.end()) 144 { 145 return true; 146 } 147 } 148 149 /* 150 * Unavailable thermal sensors, who are not present or 151 * power-state-not-matching, should not trigger the failSafe mode. For 152 * example, when a system stays at a powered-off state, its CPU Temp 153 * sensors will be unavailable, these unavailable sensors should not be 154 * treated as failed and trigger failSafe. 155 * This is important for systems whose Fans are always on. 156 */ 157 if (!_typeFan && !_available && !_unavailableAsFailed) 158 { 159 return false; 160 } 161 162 // If a reading has came in, 163 // but its value bad in some way (determined by sensor type), 164 // indicate this sensor has failed, 165 // until another value comes in that is no longer bad. 166 // This is different from the overall _failed flag, 167 // which is set and cleared by other causes. 168 if (_badReading) 169 { 170 return true; 171 } 172 173 // If a reading has came in, and it is not a bad reading, 174 // but it indicates there is no more thermal margin left, 175 // that is bad, something is wrong with the PID loops, 176 // they are not cooling the system, enable failsafe mode also. 177 if (_marginHot) 178 { 179 return true; 180 } 181 182 return _failed || !_available || !_functional; 183 } 184 185 void DbusPassive::setFailed(bool value) 186 { 187 _failed = value; 188 } 189 190 void DbusPassive::setFunctional(bool value) 191 { 192 _functional = value; 193 } 194 195 void DbusPassive::setAvailable(bool value) 196 { 197 _available = value; 198 } 199 200 int64_t DbusPassive::getScale(void) 201 { 202 return _scale; 203 } 204 205 std::string DbusPassive::getID(void) 206 { 207 return _id; 208 } 209 210 double DbusPassive::getMax(void) 211 { 212 return _max; 213 } 214 215 double DbusPassive::getMin(void) 216 { 217 return _min; 218 } 219 220 void DbusPassive::updateValue(double value, bool force) 221 { 222 _badReading = false; 223 224 // Do not let a NAN, or other floating-point oddity, be used to update 225 // the value, as that indicates the sensor has no valid reading. 226 if (!(std::isfinite(value))) 227 { 228 _badReading = true; 229 230 // Do not continue with a bad reading, unless caller forcing 231 if (!force) 232 { 233 return; 234 } 235 } 236 237 value *= std::pow(10.0, _scale); 238 239 auto unscaled = value; 240 scaleSensorReading(_min, _max, value); 241 242 if (_typeMargin) 243 { 244 _marginHot = false; 245 246 // Unlike an absolute temperature sensor, 247 // where 0 degrees C is a good reading, 248 // a value received of 0 (or negative) margin is worrisome, 249 // and should be flagged. 250 // Either it indicates margin not calculated properly, 251 // or somebody forgot to set the margin-zero setpoint, 252 // or the system is really overheating that much. 253 // This is a different condition from _failed 254 // and _badReading, so it merits its own flag. 255 // The sensor has not failed, the reading is good, but the zone 256 // still needs to know that it should go to failsafe mode. 257 if (unscaled <= 0.0) 258 { 259 _marginHot = true; 260 } 261 } 262 263 setValue(value, unscaled); 264 } 265 266 int handleSensorValue(sdbusplus::message_t& msg, DbusPassive* owner) 267 { 268 std::string msgSensor; 269 std::map<std::string, std::variant<int64_t, double, bool>> msgData; 270 271 msg.read(msgSensor, msgData); 272 273 if (msgSensor == "xyz.openbmc_project.Sensor.Value") 274 { 275 auto valPropMap = msgData.find("Value"); 276 if (valPropMap != msgData.end()) 277 { 278 double value = std::visit(VariantToDoubleVisitor(), 279 valPropMap->second); 280 281 owner->updateValue(value, false); 282 } 283 } 284 else if (msgSensor == "xyz.openbmc_project.Sensor.Threshold.Critical") 285 { 286 auto criticalAlarmLow = msgData.find("CriticalAlarmLow"); 287 auto criticalAlarmHigh = msgData.find("CriticalAlarmHigh"); 288 if (criticalAlarmHigh == msgData.end() && 289 criticalAlarmLow == msgData.end()) 290 { 291 return 0; 292 } 293 294 bool asserted = false; 295 if (criticalAlarmLow != msgData.end()) 296 { 297 asserted = std::get<bool>(criticalAlarmLow->second); 298 } 299 300 // checking both as in theory you could de-assert one threshold and 301 // assert the other at the same moment 302 if (!asserted && criticalAlarmHigh != msgData.end()) 303 { 304 asserted = std::get<bool>(criticalAlarmHigh->second); 305 } 306 owner->setFailed(asserted); 307 } 308 else if (msgSensor == "xyz.openbmc_project.State.Decorator.Availability") 309 { 310 auto available = msgData.find("Available"); 311 if (available == msgData.end()) 312 { 313 return 0; 314 } 315 bool asserted = std::get<bool>(available->second); 316 owner->setAvailable(asserted); 317 if (!asserted) 318 { 319 // A thermal controller will continue its PID calculation and not 320 // trigger a 'failsafe' when some inputs are unavailable. 321 // So, forced to clear the value here to prevent a historical 322 // value to participate in a latter PID calculation. 323 owner->updateValue(std::numeric_limits<double>::quiet_NaN(), true); 324 } 325 } 326 else if (msgSensor == 327 "xyz.openbmc_project.State.Decorator.OperationalStatus") 328 { 329 auto functional = msgData.find("Functional"); 330 if (functional == msgData.end()) 331 { 332 return 0; 333 } 334 bool asserted = std::get<bool>(functional->second); 335 owner->setFunctional(asserted); 336 } 337 338 return 0; 339 } 340 341 int dbusHandleSignal(sd_bus_message* msg, void* usrData, 342 [[maybe_unused]] sd_bus_error* err) 343 { 344 auto sdbpMsg = sdbusplus::message_t(msg); 345 DbusPassive* obj = static_cast<DbusPassive*>(usrData); 346 347 return handleSensorValue(sdbpMsg, obj); 348 } 349 350 } // namespace pid_control 351