/** * Copyright © 2017 IBM Corporation * * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. * You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. */ #include "config.h" #include "power_supply.hpp" #include "elog-errors.hpp" #include "gpio.hpp" #include "names_values.hpp" #include "pmbus.hpp" #include "types.hpp" #include "utility.hpp" #include #include #include #include namespace phosphor { namespace power { namespace psu { using namespace phosphor::logging; using namespace sdbusplus::org::open_power::Witherspoon::Fault::Error; using namespace sdbusplus::xyz::openbmc_project::Common::Device::Error; PowerSupply::PowerSupply(const std::string& name, size_t inst, const std::string& objpath, const std::string& invpath, sdbusplus::bus_t& bus, const sdeventplus::Event& e, std::chrono::seconds& t, std::chrono::seconds& p) : Device(name, inst), monitorPath(objpath), pmbusIntf(objpath), inventoryPath(INVENTORY_OBJ_PATH + invpath), bus(bus), presentInterval(p), presentTimer(e, std::bind([this]() { // The hwmon path may have changed. pmbusIntf.findHwmonDir(); this->present = true; // Sync the INPUT_HISTORY data for all PSs syncHistory(); // Update the inventory for the new device updateInventory(); })), powerOnInterval(t), powerOnTimer(e, std::bind([this]() { this->powerOn = true; })) { getAccessType(); using namespace sdbusplus::bus; using namespace phosphor::pmbus; std::uint16_t statusWord = 0; try { // Read the 2 byte STATUS_WORD value to check for faults. statusWord = pmbusIntf.read(STATUS_WORD, Type::Debug); if (!((statusWord & status_word::INPUT_FAULT_WARN) || (statusWord & status_word::VIN_UV_FAULT))) { resolveError(inventoryPath, std::string(PowerSupplyInputFault::errName)); } } catch (const ReadFailure& e) { log("Unable to read the 2 byte STATUS_WORD value to check " "for power-supply input faults."); } presentMatch = std::make_unique( bus, match::rules::propertiesChanged(inventoryPath, INVENTORY_IFACE), [this](auto& msg) { this->inventoryChanged(msg); }); // Get initial presence state. updatePresence(); // Write the SN, PN, etc to the inventory updateInventory(); // Subscribe to power state changes powerOnMatch = std::make_unique( bus, match::rules::propertiesChanged(POWER_OBJ_PATH, POWER_IFACE), [this](auto& msg) { this->powerStateChanged(msg); }); // Get initial power state. updatePowerState(); } void PowerSupply::getAccessType() { using namespace phosphor::power::util; fruJson = loadJSONFromFile(PSU_JSON_PATH); if (fruJson == nullptr) { log("InternalFailure when parsing the JSON file"); return; } inventoryPMBusAccessType = getPMBusAccessType(fruJson); } void PowerSupply::captureCmd(util::NamesValues& nv, const std::string& cmd, phosphor::pmbus::Type type) { if (pmbusIntf.exists(cmd, type)) { try { auto val = pmbusIntf.read(cmd, type); nv.add(cmd, val); } catch (const std::exception& e) { log("Unable to capture metadata", entry("CMD=%s", cmd.c_str())); } } } void PowerSupply::analyze() { using namespace phosphor::pmbus; try { if (present) { std::uint16_t statusWord = 0; // Read the 2 byte STATUS_WORD value to check for faults. statusWord = pmbusIntf.read(STATUS_WORD, Type::Debug); readFail = 0; checkInputFault(statusWord); if (powerOn && (inputFault == 0) && !faultFound) { checkFanFault(statusWord); checkTemperatureFault(statusWord); checkOutputOvervoltageFault(statusWord); checkCurrentOutOverCurrentFault(statusWord); checkPGOrUnitOffFault(statusWord); } updateHistory(); } } catch (const ReadFailure& e) { if (readFail < FAULT_COUNT) { readFail++; } if (!readFailLogged && readFail >= FAULT_COUNT) { commit(); readFailLogged = true; } } return; } void PowerSupply::inventoryChanged(sdbusplus::message_t& msg) { std::string msgSensor; std::map> msgData; msg.read(msgSensor, msgData); // Check if it was the Present property that changed. auto valPropMap = msgData.find(PRESENT_PROP); if (valPropMap != msgData.end()) { if (std::get(valPropMap->second)) { clearFaults(); presentTimer.restartOnce(presentInterval); } else { present = false; presentTimer.setEnabled(false); // Clear out the now outdated inventory properties updateInventory(); } } return; } void PowerSupply::updatePresence() { // Use getProperty utility function to get presence status. std::string service = "xyz.openbmc_project.Inventory.Manager"; util::getProperty(INVENTORY_IFACE, PRESENT_PROP, inventoryPath, service, bus, this->present); } void PowerSupply::powerStateChanged(sdbusplus::message_t& msg) { int32_t state = 0; std::string msgSensor; std::map> msgData; msg.read(msgSensor, msgData); // Check if it was the Present property that changed. auto valPropMap = msgData.find("state"); if (valPropMap != msgData.end()) { state = std::get(valPropMap->second); // Power is on when state=1. Set the fault logged variables to false // and start the power on timer when the state changes to 1. if (state) { clearFaults(); powerOnTimer.restartOnce(powerOnInterval); } else { powerOnTimer.setEnabled(false); powerOn = false; } } } void PowerSupply::updatePowerState() { powerOn = util::isPoweredOn(bus); } void PowerSupply::checkInputFault(const uint16_t statusWord) { using namespace phosphor::pmbus; if ((inputFault < FAULT_COUNT) && ((statusWord & status_word::INPUT_FAULT_WARN) || (statusWord & status_word::VIN_UV_FAULT))) { if (inputFault == 0) { log("INPUT or VIN_UV fault", entry("STATUS_WORD=0x%04X", statusWord)); } inputFault++; } else { if ((inputFault > 0) && !(statusWord & status_word::INPUT_FAULT_WARN) && !(statusWord & status_word::VIN_UV_FAULT)) { inputFault = 0; faultFound = false; // When an input fault occurs, the power supply cannot be on. // However, the check for the case where the power supply should be // on will stop when there is a fault found. // Clear the powerOnFault when the inputFault is cleared to reset // the powerOnFault de-glitching. powerOnFault = 0; log("INPUT_FAULT_WARN cleared", entry("POWERSUPPLY=%s", inventoryPath.c_str())); resolveError(inventoryPath, std::string(PowerSupplyInputFault::errName)); if (powerOn) { // The power supply will not be immediately powered on after // the input power is restored. powerOn = false; // Start up the timer that will set the state to indicate we // are ready for the powered on fault checks. powerOnTimer.restartOnce(powerOnInterval); } } } if (!faultFound && (inputFault >= FAULT_COUNT)) { // If the power is on, report the fault in an error log entry. if (powerOn) { util::NamesValues nv; nv.add("STATUS_WORD", statusWord); captureCmd(nv, STATUS_INPUT, Type::Debug); using metadata = org::open_power::Witherspoon::Fault::PowerSupplyInputFault; report( metadata::RAW_STATUS(nv.get().c_str()), metadata::CALLOUT_INVENTORY_PATH(inventoryPath.c_str())); faultFound = true; } } } void PowerSupply::checkPGOrUnitOffFault(const uint16_t statusWord) { using namespace phosphor::pmbus; if (powerOnFault < FAULT_COUNT) { // Check PG# and UNIT_IS_OFF if ((statusWord & status_word::POWER_GOOD_NEGATED) || (statusWord & status_word::UNIT_IS_OFF)) { log("PGOOD or UNIT_IS_OFF bit bad", entry("STATUS_WORD=0x%04X", statusWord)); powerOnFault++; } else { if (powerOnFault > 0) { log("PGOOD and UNIT_IS_OFF bits good"); powerOnFault = 0; } } if (!faultFound && (powerOnFault >= FAULT_COUNT)) { faultFound = true; util::NamesValues nv; nv.add("STATUS_WORD", statusWord); captureCmd(nv, STATUS_INPUT, Type::Debug); auto status0Vout = pmbusIntf.insertPageNum(STATUS_VOUT, 0); captureCmd(nv, status0Vout, Type::Debug); captureCmd(nv, STATUS_IOUT, Type::Debug); captureCmd(nv, STATUS_MFR, Type::Debug); using metadata = org::open_power::Witherspoon::Fault::PowerSupplyShouldBeOn; // A power supply is OFF (or pgood low) but should be on. report( metadata::RAW_STATUS(nv.get().c_str()), metadata::CALLOUT_INVENTORY_PATH(inventoryPath.c_str())); } } } void PowerSupply::checkCurrentOutOverCurrentFault(const uint16_t statusWord) { using namespace phosphor::pmbus; if (outputOCFault < FAULT_COUNT) { // Check for an output overcurrent fault. if ((statusWord & status_word::IOUT_OC_FAULT)) { outputOCFault++; } else { if (outputOCFault > 0) { outputOCFault = 0; } } if (!faultFound && (outputOCFault >= FAULT_COUNT)) { util::NamesValues nv; nv.add("STATUS_WORD", statusWord); captureCmd(nv, STATUS_INPUT, Type::Debug); auto status0Vout = pmbusIntf.insertPageNum(STATUS_VOUT, 0); captureCmd(nv, status0Vout, Type::Debug); captureCmd(nv, STATUS_IOUT, Type::Debug); captureCmd(nv, STATUS_MFR, Type::Debug); using metadata = org::open_power::Witherspoon::Fault:: PowerSupplyOutputOvercurrent; report( metadata::RAW_STATUS(nv.get().c_str()), metadata::CALLOUT_INVENTORY_PATH(inventoryPath.c_str())); faultFound = true; } } } void PowerSupply::checkOutputOvervoltageFault(const uint16_t statusWord) { using namespace phosphor::pmbus; if (outputOVFault < FAULT_COUNT) { // Check for an output overvoltage fault. if (statusWord & status_word::VOUT_OV_FAULT) { outputOVFault++; } else { if (outputOVFault > 0) { outputOVFault = 0; } } if (!faultFound && (outputOVFault >= FAULT_COUNT)) { util::NamesValues nv; nv.add("STATUS_WORD", statusWord); captureCmd(nv, STATUS_INPUT, Type::Debug); auto status0Vout = pmbusIntf.insertPageNum(STATUS_VOUT, 0); captureCmd(nv, status0Vout, Type::Debug); captureCmd(nv, STATUS_IOUT, Type::Debug); captureCmd(nv, STATUS_MFR, Type::Debug); using metadata = org::open_power::Witherspoon::Fault:: PowerSupplyOutputOvervoltage; report( metadata::RAW_STATUS(nv.get().c_str()), metadata::CALLOUT_INVENTORY_PATH(inventoryPath.c_str())); faultFound = true; } } } void PowerSupply::checkFanFault(const uint16_t statusWord) { using namespace phosphor::pmbus; if (fanFault < FAULT_COUNT) { // Check for a fan fault or warning condition if (statusWord & status_word::FAN_FAULT) { fanFault++; } else { if (fanFault > 0) { fanFault = 0; } } if (!faultFound && (fanFault >= FAULT_COUNT)) { util::NamesValues nv; nv.add("STATUS_WORD", statusWord); captureCmd(nv, STATUS_MFR, Type::Debug); captureCmd(nv, STATUS_TEMPERATURE, Type::Debug); captureCmd(nv, STATUS_FANS_1_2, Type::Debug); using metadata = org::open_power::Witherspoon::Fault::PowerSupplyFanFault; report( metadata::RAW_STATUS(nv.get().c_str()), metadata::CALLOUT_INVENTORY_PATH(inventoryPath.c_str())); faultFound = true; } } } void PowerSupply::checkTemperatureFault(const uint16_t statusWord) { using namespace phosphor::pmbus; // Due to how the PMBus core device driver sends a clear faults command // the bit in STATUS_WORD will likely be cleared when we attempt to examine // it for a Thermal Fault or Warning. So, check the STATUS_WORD and the // STATUS_TEMPERATURE bits. If either indicates a fault, proceed with // logging the over-temperature condition. std::uint8_t statusTemperature = 0; statusTemperature = pmbusIntf.read(STATUS_TEMPERATURE, Type::Debug); if (temperatureFault < FAULT_COUNT) { if ((statusWord & status_word::TEMPERATURE_FAULT_WARN) || (statusTemperature & status_temperature::OT_FAULT)) { temperatureFault++; } else { if (temperatureFault > 0) { temperatureFault = 0; } } if (!faultFound && (temperatureFault >= FAULT_COUNT)) { // The power supply has had an over-temperature condition. // This may not result in a shutdown if experienced for a short // duration. // This should not occur under normal conditions. // The power supply may be faulty, or the paired supply may be // putting out less current. // Capture command responses with potentially relevant information, // and call out the power supply reporting the condition. util::NamesValues nv; nv.add("STATUS_WORD", statusWord); captureCmd(nv, STATUS_MFR, Type::Debug); captureCmd(nv, STATUS_IOUT, Type::Debug); nv.add("STATUS_TEMPERATURE", statusTemperature); captureCmd(nv, STATUS_FANS_1_2, Type::Debug); using metadata = org::open_power::Witherspoon::Fault:: PowerSupplyTemperatureFault; report( metadata::RAW_STATUS(nv.get().c_str()), metadata::CALLOUT_INVENTORY_PATH(inventoryPath.c_str())); faultFound = true; } } } void PowerSupply::clearFaults() { readFail = 0; readFailLogged = false; inputFault = 0; powerOnFault = 0; outputOCFault = 0; outputOVFault = 0; fanFault = 0; temperatureFault = 0; faultFound = false; return; } void PowerSupply::resolveError(const std::string& callout, const std::string& message) { using EndpointList = std::vector; try { auto path = callout + "/fault"; // Get the service name from the mapper for the fault callout auto service = util::getService(path, ASSOCIATION_IFACE, bus); // Use getProperty utility function to get log entries (endpoints) EndpointList logEntries; util::getProperty(ASSOCIATION_IFACE, ENDPOINTS_PROP, path, service, bus, logEntries); // It is possible that all such entries for this callout have since // been deleted. if (logEntries.empty()) { return; } auto logEntryService = util::getService(logEntries[0], LOGGING_IFACE, bus); if (logEntryService.empty()) { return; } // go through each log entry that matches this callout path std::string logMessage; for (const auto& logEntry : logEntries) { // Check to see if this logEntry has a message that matches. util::getProperty(LOGGING_IFACE, MESSAGE_PROP, logEntry, logEntryService, bus, logMessage); if (message == logMessage) { // Log entry matches call out and message, set Resolved to true bool resolved = true; util::setProperty(LOGGING_IFACE, RESOLVED_PROP, logEntry, logEntryService, bus, resolved); } } } catch (const std::exception& e) { log("Failed to resolve error", entry("CALLOUT=%s", callout.c_str()), entry("ERROR=%s", message.c_str())); } } void PowerSupply::updateInventory() { using namespace phosphor::pmbus; using namespace sdbusplus::message; // Build the object map and send it to the inventory using Properties = std::map>; using Interfaces = std::map; using Object = std::map; Properties assetProps; Properties operProps; Interfaces interfaces; Object object; // If any of these accesses fail, the fields will just be // blank in the inventory. Leave logging ReadFailure errors // to analyze() as it runs continuously and will most // likely hit and threshold them first anyway. The // readString() function will do the tracing of the failing // path so this code doesn't need to. for (const auto& fru : fruJson.at("fruConfigs")) { if (fru.at("interface") == ASSET_IFACE) { try { assetProps.emplace( fru.at("propertyName"), present ? pmbusIntf.readString(fru.at("fileName"), inventoryPMBusAccessType) : ""); } catch (const ReadFailure& e) {} } } operProps.emplace(FUNCTIONAL_PROP, present); interfaces.emplace(ASSET_IFACE, std::move(assetProps)); interfaces.emplace(OPERATIONAL_STATE_IFACE, std::move(operProps)); // For Notify(), just send the relative path of the inventory // object so remove the INVENTORY_OBJ_PATH prefix auto path = inventoryPath.substr(strlen(INVENTORY_OBJ_PATH)); object.emplace(path, std::move(interfaces)); try { auto service = util::getService(INVENTORY_OBJ_PATH, INVENTORY_MGR_IFACE, bus); if (service.empty()) { log("Unable to get inventory manager service"); return; } auto method = bus.new_method_call(service.c_str(), INVENTORY_OBJ_PATH, INVENTORY_MGR_IFACE, "Notify"); method.append(std::move(object)); auto reply = bus.call(method); } catch (const std::exception& e) { log(e.what(), entry("PATH=%s", inventoryPath.c_str())); } } void PowerSupply::syncHistory() { using namespace phosphor::gpio; if (syncGPIODevPath.empty()) { // Sync not implemented return; } GPIO gpio{syncGPIODevPath, static_cast(syncGPIONumber), Direction::output}; try { gpio.set(Value::low); std::this_thread::sleep_for(std::chrono::milliseconds{5}); gpio.set(Value::high); recordManager->clear(); } catch (const std::exception& e) { // Do nothing. There would already be a journal entry. } } void PowerSupply::enableHistory(const std::string& objectPath, size_t numRecords, const std::string& syncGPIOPath, size_t syncGPIONum) { historyObjectPath = objectPath; syncGPIODevPath = syncGPIOPath; syncGPIONumber = syncGPIONum; recordManager = std::make_unique(numRecords); auto avgPath = historyObjectPath + '/' + history::Average::name; auto maxPath = historyObjectPath + '/' + history::Maximum::name; average = std::make_unique(bus, avgPath); maximum = std::make_unique(bus, maxPath); } void PowerSupply::updateHistory() { if (!recordManager) { // Not enabled return; } // Read just the most recent average/max record auto data = pmbusIntf.readBinary(INPUT_HISTORY, pmbus::Type::HwmonDeviceDebug, history::RecordManager::RAW_RECORD_SIZE); // Update D-Bus only if something changed (a new record ID, or cleared out) auto changed = recordManager->add(data); if (changed) { average->values(std::move(recordManager->getAverageRecords())); maximum->values(std::move(recordManager->getMaximumRecords())); } } } // namespace psu } // namespace power } // namespace phosphor