1 /**
2  * Copyright © 2017 IBM Corporation
3  *
4  * Licensed under the Apache License, Version 2.0 (the "License");
5  * you may not use this file except in compliance with the License.
6  * You may obtain a copy of the License at
7  *
8  *     http://www.apache.org/licenses/LICENSE-2.0
9  *
10  * Unless required by applicable law or agreed to in writing, software
11  * distributed under the License is distributed on an "AS IS" BASIS,
12  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13  * See the License for the specific language governing permissions and
14  * limitations under the License.
15  */
16 #include <phosphor-logging/log.hpp>
17 #include <phosphor-logging/elog.hpp>
18 #include <org/open_power/Witherspoon/Fault/error.hpp>
19 #include <xyz/openbmc_project/Common/Device/error.hpp>
20 #include "elog-errors.hpp"
21 #include "names_values.hpp"
22 #include "power_supply.hpp"
23 #include "pmbus.hpp"
24 #include "utility.hpp"
25 
26 using namespace phosphor::logging;
27 using namespace sdbusplus::org::open_power::Witherspoon::Fault::Error;
28 using namespace sdbusplus::xyz::openbmc_project::Common::Device::Error;
29 
30 namespace witherspoon
31 {
32 namespace power
33 {
34 namespace psu
35 {
36 
// D-Bus root path under which the power supply inventory objects live; the
// per-supply inventory path is appended to it.
constexpr const char* INVENTORY_OBJ_PATH = "/xyz/openbmc_project/inventory";
// D-Bus interface that carries the presence property.
constexpr const char* INVENTORY_INTERFACE =
    "xyz.openbmc_project.Inventory.Item";
// Name of the presence property on INVENTORY_INTERFACE.
constexpr const char* PRESENT_PROP = "Present";
// D-Bus object path and interface used to read the system power state.
constexpr const char* POWER_OBJ_PATH = "/org/openbmc/control/power0";
constexpr const char* POWER_INTERFACE = "org.openbmc.control.Power";
42 
43 PowerSupply::PowerSupply(const std::string& name, size_t inst,
44                          const std::string& objpath,
45                          const std::string& invpath,
46                          sdbusplus::bus::bus& bus,
47                          event::Event& e,
48                          std::chrono::seconds& t)
49     : Device(name, inst), monitorPath(objpath), pmbusIntf(objpath),
50       inventoryPath(invpath), bus(bus), event(e), powerOnInterval(t),
51       powerOnTimer(e, [this]()
52                    {
53                        this->powerOn = true;
54                    })
55 {
56     using namespace sdbusplus::bus;
57     auto present_obj_path = INVENTORY_OBJ_PATH + inventoryPath;
58     presentMatch = std::make_unique<match_t>(bus,
59                                              match::rules::propertiesChanged(
60                                                      present_obj_path,
61                                                      INVENTORY_INTERFACE),
62                                              [this](auto& msg)
63                                              {
64                                                  this->inventoryChanged(msg);
65                                              });
66     // Get initial presence state.
67     updatePresence();
68 
69     // Subscribe to power state changes
70     powerOnMatch = std::make_unique<match_t>(bus,
71                                              match::rules::propertiesChanged(
72                                                      POWER_OBJ_PATH,
73                                                      POWER_INTERFACE),
74                                              [this](auto& msg)
75                                              {
76                                                  this->powerStateChanged(msg);
77                                              });
78     // Get initial power state.
79     updatePowerState();
80 }
81 
82 void PowerSupply::captureCmd(util::NamesValues& nv, const std::string& cmd,
83                              witherspoon::pmbus::Type type)
84 {
85     if (pmbusIntf.exists(cmd, type))
86     {
87         try
88         {
89             auto val = pmbusIntf.read(cmd, type);
90             nv.add(cmd, val);
91         }
92         catch (std::exception& e)
93         {
94             log<level::INFO>("Unable to capture metadata", entry("CMD=%s",
95                                                                  cmd));
96         }
97     }
98 }
99 
100 void PowerSupply::analyze()
101 {
102     using namespace witherspoon::pmbus;
103 
104     try
105     {
106         if (present)
107         {
108             std::uint16_t statusWord = 0;
109 
110             // Read the 2 byte STATUS_WORD value to check for faults.
111             statusWord = pmbusIntf.read(STATUS_WORD, Type::Debug);
112 
113             //TODO: 3 consecutive reads should be performed.
114             // If 3 consecutive reads are seen, log the fault.
115             // Driver gives cached value, read once a second.
116             // increment for fault on, decrement for fault off, to deglitch.
117             // If count reaches 3, we have fault. If count reaches 0, fault is
118             // cleared.
119 
120             checkInputFault(statusWord);
121 
122             if (powerOn && !inputFault)
123             {
124                 checkFanFault(statusWord);
125                 checkTemperatureFault(statusWord);
126                 checkOutputOvervoltageFault(statusWord);
127                 checkCurrentOutOverCurrentFault(statusWord);
128                 checkPGOrUnitOffFault(statusWord);
129             }
130         }
131     }
132     catch (ReadFailure& e)
133     {
134         if (!readFailLogged)
135         {
136             commit<ReadFailure>();
137             readFailLogged = true;
138         }
139     }
140 
141     return;
142 }
143 
144 void PowerSupply::inventoryChanged(sdbusplus::message::message& msg)
145 {
146     std::string msgSensor;
147     std::map<std::string, sdbusplus::message::variant<uint32_t, bool>> msgData;
148     msg.read(msgSensor, msgData);
149 
150     // Check if it was the Present property that changed.
151     auto valPropMap = msgData.find(PRESENT_PROP);
152     if (valPropMap != msgData.end())
153     {
154         present = sdbusplus::message::variant_ns::get<bool>(valPropMap->second);
155 
156         if (present)
157         {
158             clearFaults();
159         }
160     }
161 
162     return;
163 }
164 
165 void PowerSupply::updatePresence()
166 {
167     // Use getProperty utility function to get presence status.
168     std::string path = INVENTORY_OBJ_PATH + inventoryPath;
169     std::string service = "xyz.openbmc_project.Inventory.Manager";
170 
171     util::getProperty(INVENTORY_INTERFACE, PRESENT_PROP, path,service, bus,
172                       this->present);
173 }
174 
175 void PowerSupply::powerStateChanged(sdbusplus::message::message& msg)
176 {
177     int32_t state = 0;
178     std::string msgSensor;
179     std::map<std::string, sdbusplus::message::variant<int32_t, int32_t>>
180             msgData;
181     msg.read(msgSensor, msgData);
182 
183     // Check if it was the Present property that changed.
184     auto valPropMap = msgData.find("state");
185     if (valPropMap != msgData.end())
186     {
187         state = sdbusplus::message::variant_ns::get<int32_t>(valPropMap->second);
188 
189         // Power is on when state=1. Set the fault logged variables to false
190         // and start the power on timer when the state changes to 1.
191         if (state)
192         {
193             clearFaults();
194             powerOnTimer.start(powerOnInterval, Timer::TimerType::oneshot);
195         }
196         else
197         {
198             powerOnTimer.stop();
199             powerOn = false;
200         }
201     }
202 
203 }
204 
205 void PowerSupply::updatePowerState()
206 {
207     // When state = 1, system is powered on
208     int32_t state = 0;
209 
210     try
211     {
212         auto service = util::getService(POWER_OBJ_PATH,
213                                         POWER_INTERFACE,
214                                         bus);
215 
216         // Use getProperty utility function to get power state.
217         util::getProperty<int32_t>(POWER_INTERFACE,
218                                    "state",
219                                    POWER_OBJ_PATH,
220                                    service,
221                                    bus,
222                                    state);
223 
224         if (state)
225         {
226             powerOn = true;
227         }
228         else
229         {
230             powerOn = false;
231         }
232     }
233     catch (std::exception& e)
234     {
235         log<level::INFO>("Failed to get power state. Assuming it is off.");
236         powerOn = false;
237     }
238 
239 }
240 
241 void PowerSupply::checkInputFault(const uint16_t statusWord)
242 {
243     using namespace witherspoon::pmbus;
244 
245     std::uint8_t  statusInput = 0;
246 
247     if (!inputFault && ((statusWord & status_word::INPUT_FAULT_WARN) ||
248         (statusWord & status_word::VIN_UV_FAULT)))
249     {
250         inputFault = true;
251 
252         util::NamesValues nv;
253         nv.add("STATUS_WORD", statusWord);
254         captureCmd(nv, STATUS_INPUT, Type::Debug);
255 
256         using metadata = org::open_power::Witherspoon::Fault::
257                 PowerSupplyInputFault;
258 
259         report<PowerSupplyInputFault>(
260                 metadata::RAW_STATUS(nv.get().c_str()),
261                 metadata::CALLOUT_INVENTORY_PATH(inventoryPath.c_str()));
262     }
263     else
264     {
265         if ((inputFault) &&
266             !(statusWord & status_word::INPUT_FAULT_WARN) &&
267             !(statusWord & status_word::VIN_UV_FAULT))
268         {
269             inputFault = false;
270 
271             statusInput = pmbusIntf.read(STATUS_INPUT, Type::Debug);
272 
273             log<level::INFO>("INPUT_FAULT_WARN cleared",
274                              entry("POWERSUPPLY=%s", inventoryPath.c_str()),
275                              entry("STATUS_WORD=0x%04X", statusWord),
276                              entry("STATUS_INPUT=0x%02X", statusInput));
277 
278             if (powerOn)
279             {
280                 // The power supply will not be immediately powered on after
281                 // the input power is restored.
282                 powerOn = false;
283                 // Start up the timer that will set the state to indicate we
284                 // are ready for the powered on fault checks.
285                 powerOnTimer.start(powerOnInterval, Timer::TimerType::oneshot);
286             }
287         }
288     }
289 }
290 
291 void PowerSupply::checkPGOrUnitOffFault(const uint16_t statusWord)
292 {
293     using namespace witherspoon::pmbus;
294 
295     if (powerOnFault < FAULT_COUNT)
296     {
297         // Check PG# and UNIT_IS_OFF
298         if ((statusWord & status_word::POWER_GOOD_NEGATED) ||
299             (statusWord & status_word::UNIT_IS_OFF))
300         {
301             log<level::INFO>("PGOOD or UNIT_IS_OFF bit bad",
302                              entry("STATUS_WORD=0x%04X", statusWord));
303             powerOnFault++;
304         }
305         else
306         {
307             if (powerOnFault > 0)
308             {
309                 log<level::INFO>("PGOOD and UNIT_IS_OFF bits good");
310                 powerOnFault = 0;
311             }
312         }
313 
314         if (powerOnFault >= FAULT_COUNT)
315         {
316             util::NamesValues nv;
317             nv.add("STATUS_WORD", statusWord);
318             captureCmd(nv, STATUS_INPUT, Type::Debug);
319             auto status0Vout = pmbusIntf.insertPageNum(STATUS_VOUT, 0);
320             captureCmd(nv, status0Vout, Type::Debug);
321             captureCmd(nv, STATUS_IOUT, Type::Debug);
322             captureCmd(nv, STATUS_MFR, Type::Debug);
323 
324             using metadata = org::open_power::Witherspoon::Fault::
325                     PowerSupplyShouldBeOn;
326 
327             // A power supply is OFF (or pgood low) but should be on.
328             report<PowerSupplyShouldBeOn>(
329                     metadata::RAW_STATUS(nv.get().c_str()),
330                     metadata::CALLOUT_INVENTORY_PATH(
331                             inventoryPath.c_str()));
332         }
333     }
334 
335 }
336 
337 void PowerSupply::checkCurrentOutOverCurrentFault(const uint16_t statusWord)
338 {
339     using namespace witherspoon::pmbus;
340 
341     // Check for an output overcurrent fault.
342     if ((statusWord & status_word::IOUT_OC_FAULT) &&
343         !outputOCFault)
344     {
345         util::NamesValues nv;
346         nv.add("STATUS_WORD", statusWord);
347         captureCmd(nv, STATUS_INPUT, Type::Debug);
348         auto status0Vout = pmbusIntf.insertPageNum(STATUS_VOUT, 0);
349         captureCmd(nv, status0Vout, Type::Debug);
350         captureCmd(nv, STATUS_IOUT, Type::Debug);
351         captureCmd(nv, STATUS_MFR, Type::Debug);
352 
353         using metadata = org::open_power::Witherspoon::Fault::
354                 PowerSupplyOutputOvercurrent;
355 
356         report<PowerSupplyOutputOvercurrent>(metadata::RAW_STATUS(
357                                                      nv.get().c_str()),
358                                              metadata::CALLOUT_INVENTORY_PATH(
359                                                      inventoryPath.c_str()));
360 
361         outputOCFault = true;
362     }
363 }
364 
365 void PowerSupply::checkOutputOvervoltageFault(const uint16_t statusWord)
366 {
367     using namespace witherspoon::pmbus;
368 
369     // Check for an output overvoltage fault.
370     if ((statusWord & status_word::VOUT_OV_FAULT) &&
371         !outputOVFault)
372     {
373         util::NamesValues nv;
374         nv.add("STATUS_WORD", statusWord);
375         captureCmd(nv, STATUS_INPUT, Type::Debug);
376         auto status0Vout = pmbusIntf.insertPageNum(STATUS_VOUT, 0);
377         captureCmd(nv, status0Vout, Type::Debug);
378         captureCmd(nv, STATUS_IOUT, Type::Debug);
379         captureCmd(nv, STATUS_MFR, Type::Debug);
380 
381         using metadata = org::open_power::Witherspoon::Fault::
382                 PowerSupplyOutputOvervoltage;
383 
384         report<PowerSupplyOutputOvervoltage>(metadata::RAW_STATUS(
385                                                      nv.get().c_str()),
386                                              metadata::CALLOUT_INVENTORY_PATH(
387                                                      inventoryPath.c_str()));
388 
389         outputOVFault = true;
390     }
391 }
392 
393 void PowerSupply::checkFanFault(const uint16_t statusWord)
394 {
395     using namespace witherspoon::pmbus;
396 
397     // Check for a fan fault or warning condition
398     if ((statusWord & status_word::FAN_FAULT) &&
399         !fanFault)
400     {
401         util::NamesValues nv;
402         nv.add("STATUS_WORD", statusWord);
403         captureCmd(nv, STATUS_MFR, Type::Debug);
404         captureCmd(nv, STATUS_TEMPERATURE, Type::Debug);
405         captureCmd(nv, STATUS_FANS_1_2, Type::Debug);
406 
407         using metadata = org::open_power::Witherspoon::Fault::
408                 PowerSupplyFanFault;
409 
410         report<PowerSupplyFanFault>(
411                 metadata::RAW_STATUS(nv.get().c_str()),
412                 metadata::CALLOUT_INVENTORY_PATH(inventoryPath.c_str()));
413 
414         fanFault = true;
415     }
416 }
417 
418 void PowerSupply::checkTemperatureFault(const uint16_t statusWord)
419 {
420     using namespace witherspoon::pmbus;
421 
422     // Due to how the PMBus core device driver sends a clear faults command
423     // the bit in STATUS_WORD will likely be cleared when we attempt to examine
424     // it for a Thermal Fault or Warning. So, check the STATUS_WORD and the
425     // STATUS_TEMPERATURE bits. If either indicates a fault, proceed with
426     // logging the over-temperature condition.
427     std::uint8_t statusTemperature = 0;
428     statusTemperature = pmbusIntf.read(STATUS_TEMPERATURE, Type::Debug);
429     if (((statusWord & status_word::TEMPERATURE_FAULT_WARN) ||
430          (statusTemperature & status_temperature::OT_FAULT)) &&
431         !temperatureFault)
432     {
433         // The power supply has had an over-temperature condition.
434         // This may not result in a shutdown if experienced for a short
435         // duration.
436         // This should not occur under normal conditions.
437         // The power supply may be faulty, or the paired supply may be putting
438         // out less current.
439         // Capture command responses with potentially relevant information,
440         // and call out the power supply reporting the condition.
441         util::NamesValues nv;
442         nv.add("STATUS_WORD", statusWord);
443         captureCmd(nv, STATUS_MFR, Type::Debug);
444         captureCmd(nv, STATUS_IOUT, Type::Debug);
445         nv.add("STATUS_TEMPERATURE", statusTemperature);
446         captureCmd(nv, STATUS_FANS_1_2, Type::Debug);
447 
448         using metadata = org::open_power::Witherspoon::Fault::
449                 PowerSupplyTemperatureFault;
450 
451         report<PowerSupplyTemperatureFault>(
452                 metadata::RAW_STATUS(nv.get().c_str()),
453                 metadata::CALLOUT_INVENTORY_PATH(inventoryPath.c_str()));
454 
455         temperatureFault = true;
456     }
457 }
458 
459 void PowerSupply::clearFaults()
460 {
461     readFailLogged = false;
462     inputFault = false;
463     powerOnFault = 0;
464     outputOCFault = false;
465     outputOVFault = false;
466     fanFault = false;
467     temperatureFault = false;
468 
469     return;
470 }
471 
472 }
473 }
474 }
475