xref: /openbmc/phosphor-logging/extensions/openpower-pels/manager.cpp (revision b6d3e2fc727801053925d99081486989fc320900)
1 /**
2  * Copyright © 2019 IBM Corporation
3  *
4  * Licensed under the Apache License, Version 2.0 (the "License");
5  * you may not use this file except in compliance with the License.
6  * You may obtain a copy of the License at
7  *
8  *     http://www.apache.org/licenses/LICENSE-2.0
9  *
10  * Unless required by applicable law or agreed to in writing, software
11  * distributed under the License is distributed on an "AS IS" BASIS,
12  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13  * See the License for the specific language governing permissions and
14  * limitations under the License.
15  */
16 #include "manager.hpp"
17 
18 #include "additional_data.hpp"
19 #include "elog_serialize.hpp"
20 #include "json_utils.hpp"
21 #include "pel.hpp"
22 #include "pel_entry.hpp"
23 #include "service_indicators.hpp"
24 #include "severity.hpp"
25 
26 #include <sys/inotify.h>
27 #include <unistd.h>
28 
29 #include <phosphor-logging/lg2.hpp>
30 #include <xyz/openbmc_project/Common/error.hpp>
31 #include <xyz/openbmc_project/Logging/Create/server.hpp>
32 
33 #include <filesystem>
34 #include <format>
35 #include <fstream>
36 #include <locale>
37 
38 namespace openpower
39 {
40 namespace pels
41 {
42 
43 using namespace phosphor::logging;
44 namespace fs = std::filesystem;
45 namespace rg = openpower::pels::message;
46 
47 namespace common_error = sdbusplus::xyz::openbmc_project::Common::Error;
48 
49 using Create = sdbusplus::server::xyz::openbmc_project::logging::Create;
50 
51 namespace additional_data
52 {
53 constexpr auto rawPEL = "RAWPEL";
54 constexpr auto esel = "ESEL";
55 constexpr auto error = "ERROR_NAME";
56 } // namespace additional_data
57 
58 constexpr auto defaultLogMessage = "xyz.openbmc_project.Logging.Error.Default";
59 constexpr uint32_t bmcThermalCompID = 0x2700;
60 constexpr uint32_t bmcFansCompID = 0x2800;
61 
~Manager()62 Manager::~Manager()
63 {
64     if (_pelFileDeleteFD != -1)
65     {
66         if (_pelFileDeleteWatchFD != -1)
67         {
68             inotify_rm_watch(_pelFileDeleteFD, _pelFileDeleteWatchFD);
69         }
70         close(_pelFileDeleteFD);
71     }
72 }
73 
create(const std::string & message,uint32_t obmcLogID,uint64_t timestamp,Entry::Level severity,const std::map<std::string,std::string> & additionalData,const std::vector<std::string> & associations,const FFDCEntries & ffdc)74 void Manager::create(const std::string& message, uint32_t obmcLogID,
75                      uint64_t timestamp, Entry::Level severity,
76                      const std::map<std::string, std::string>& additionalData,
77                      const std::vector<std::string>& associations,
78                      const FFDCEntries& ffdc)
79 {
80     AdditionalData ad{additionalData};
81 
82     // If a PEL was passed in via a filename or in an ESEL,
83     // use that.  Otherwise, create one.
84     auto rawPelPath = ad.getValue(additional_data::rawPEL);
85     if (rawPelPath)
86     {
87         addRawPEL(*rawPelPath, obmcLogID);
88     }
89     else
90     {
91         auto esel = ad.getValue(additional_data::esel);
92         if (esel)
93         {
94             addESELPEL(*esel, obmcLogID);
95         }
96         else
97         {
98             createPEL(message, obmcLogID, timestamp, severity, additionalData,
99                       associations, ffdc);
100         }
101     }
102 
103     setEntryPath(obmcLogID);
104     setServiceProviderNotifyFlag(obmcLogID);
105 }
106 
addRawPEL(const std::string & rawPelPath,uint32_t obmcLogID)107 void Manager::addRawPEL(const std::string& rawPelPath, uint32_t obmcLogID)
108 {
109     if (fs::exists(rawPelPath))
110     {
111         std::ifstream file(rawPelPath, std::ios::in | std::ios::binary);
112 
113         auto data = std::vector<uint8_t>(std::istreambuf_iterator<char>(file),
114                                          std::istreambuf_iterator<char>());
115         if (file.fail())
116         {
117             lg2::error(
118                 "Filesystem error reading a raw PEL. File = {FILE}, obmcLogID = {LOGID}",
119                 "FILE", rawPelPath, "LOGID", obmcLogID);
120             // TODO, Decide what to do here. Maybe nothing.
121             return;
122         }
123 
124         file.close();
125 
126         addPEL(data, obmcLogID);
127 
128         std::error_code ec;
129         fs::remove(rawPelPath, ec);
130     }
131     else
132     {
133         lg2::error(
134             "Raw PEL file from BMC event log does not exit. File = {FILE}, obmcLogID = {LOGID}",
135             "FILE", rawPelPath, "LOGID", obmcLogID);
136     }
137 }
138 
addPEL(std::vector<uint8_t> & pelData,uint32_t obmcLogID)139 void Manager::addPEL(std::vector<uint8_t>& pelData, uint32_t obmcLogID)
140 {
141     auto pel = std::make_unique<openpower::pels::PEL>(pelData, obmcLogID);
142     if (pel->valid())
143     {
144         // PELs created by others still need this field set by us.
145         pel->setCommitTime();
146 
147         // Assign Id other than to Hostbot PEL
148         if ((pel->privateHeader()).creatorID() !=
149             static_cast<uint8_t>(CreatorID::hostboot))
150         {
151             pel->assignID();
152         }
153         else
154         {
155             const Repository::LogID id{Repository::LogID::Pel(pel->id())};
156             auto result = _repo.hasPEL(id);
157             if (result)
158             {
159                 lg2::warning(
160                     "Duplicate HostBoot PEL ID {ID} found, moving it to archive folder",
161                     "ID", lg2::hex, pel->id());
162 
163                 _repo.archivePEL(*pel);
164 
165                 // No need to keep around the openBMC event log entry
166                 scheduleObmcLogDelete(obmcLogID);
167                 return;
168             }
169         }
170 
171         // Update System Info to Extended User Data
172         pel->updateSysInfoInExtendedUserDataSection(*_dataIface);
173 
174         // Check for severity 0x51 and update boot progress SRC
175         updateProgressSRC(pel);
176 
177         try
178         {
179             lg2::debug("Adding external PEL {ID} (BMC ID {BMCID}) to repo",
180                        "ID", lg2::hex, pel->id(), "BMCID", obmcLogID);
181             _repo.add(pel);
182 
183             if (_repo.sizeWarning())
184             {
185                 scheduleRepoPrune();
186             }
187 
188             // Activate any resulting service indicators if necessary
189             auto policy = service_indicators::getPolicy(*_dataIface);
190             policy->activate(*pel);
191         }
192         catch (const std::exception& e)
193         {
194             // Probably a full or r/o filesystem, not much we can do.
195             lg2::error("Unable to add PEL {ID} to Repository", "ID", lg2::hex,
196                        pel->id());
197         }
198 
199         updateEventId(pel);
200         updateResolution(*pel);
201         serializeLogEntry(obmcLogID);
202         createPELEntry(obmcLogID);
203 
204         // Check if firmware should quiesce system due to error
205         checkPelAndQuiesce(pel);
206     }
207     else
208     {
209         lg2::error("Invalid PEL received from the host. BMC ID = {ID}", "ID",
210                    obmcLogID);
211 
212         AdditionalData ad;
213         ad.add("PLID", getNumberString("0x%08X", pel->plid()));
214         ad.add("OBMC_LOG_ID", std::to_string(obmcLogID));
215         ad.add("PEL_SIZE", std::to_string(pelData.size()));
216 
217         std::string asciiString;
218         auto src = pel->primarySRC();
219         if (src)
220         {
221             asciiString = (*src)->asciiString();
222         }
223 
224         ad.add("SRC", asciiString);
225 
226         _eventLogger.log("org.open_power.Logging.Error.BadHostPEL",
227                          Entry::Level::Error, ad);
228 
229         // Save it to a file for debug in the lab.  Just keep the latest.
230         // Not adding it to the PEL because it could already be max size
231         // and don't want to truncate an already invalid PEL.
232         std::ofstream pelFile{getPELRepoPath() / "badPEL"};
233         pelFile.write(reinterpret_cast<const char*>(pelData.data()),
234                       pelData.size());
235 
236         // No need to keep around the openBMC event log entry
237         scheduleObmcLogDelete(obmcLogID);
238     }
239 }
240 
addESELPEL(const std::string & esel,uint32_t obmcLogID)241 void Manager::addESELPEL(const std::string& esel, uint32_t obmcLogID)
242 {
243     std::vector<uint8_t> data;
244 
245     lg2::debug("Adding PEL from ESEL. BMC ID = {ID}", "ID", obmcLogID);
246 
247     try
248     {
249         data = std::move(eselToRawData(esel));
250     }
251     catch (const std::exception& e)
252     {
253         // Try to add it below anyway, so it follows the usual bad data path.
254         lg2::error("Problems converting ESEL string to a byte vector");
255     }
256 
257     addPEL(data, obmcLogID);
258 }
259 
eselToRawData(const std::string & esel)260 std::vector<uint8_t> Manager::eselToRawData(const std::string& esel)
261 {
262     std::vector<uint8_t> data;
263     std::string byteString;
264 
265     // As the eSEL string looks like: "50 48 00 ab ..." there are 3
266     // characters per raw byte, and since the actual PEL data starts
267     // at the 16th byte, the code will grab the PEL data starting at
268     // offset 48 in the string.
269     static constexpr size_t pelStart = 16 * 3;
270 
271     if (esel.size() <= pelStart)
272     {
273         lg2::error("ESEL data too short, length = {LEN}", "LEN", esel.size());
274         throw std::length_error("ESEL data too short");
275     }
276 
277     for (size_t i = pelStart; i < esel.size(); i += 3)
278     {
279         if (i + 1 < esel.size())
280         {
281             byteString = esel.substr(i, 2);
282             data.push_back(std::stoi(byteString, nullptr, 16));
283         }
284         else
285         {
286             lg2::error("ESEL data too short, length = {LEN}", "LEN",
287                        esel.size());
288             throw std::length_error("ESEL data too short");
289         }
290     }
291 
292     return data;
293 }
294 
erase(uint32_t obmcLogID)295 void Manager::erase(uint32_t obmcLogID)
296 {
297     Repository::LogID id{Repository::LogID::Obmc(obmcLogID)};
298 
299     auto path = std::string(OBJ_ENTRY) + '/' + std::to_string(obmcLogID);
300     _pelEntries.erase(path);
301     _repo.remove(id);
302 }
303 
getLogIDWithHwIsolation(std::vector<uint32_t> & idsWithHwIsoEntry)304 void Manager::getLogIDWithHwIsolation(std::vector<uint32_t>& idsWithHwIsoEntry)
305 {
306     idsWithHwIsoEntry = _dataIface->getLogIDWithHwIsolation();
307 }
308 
isDeleteProhibited(uint32_t obmcLogID)309 bool Manager::isDeleteProhibited(uint32_t obmcLogID)
310 {
311     auto entryPath{std::string(OBJ_ENTRY) + '/' + std::to_string(obmcLogID)};
312     auto entry = _pelEntries.find(entryPath);
313     if (entry != _pelEntries.end())
314     {
315         if (entry->second->guard())
316         {
317             auto hwIsolationAssocPaths = _dataIface->getAssociatedPaths(
318                 entryPath += "/isolated_hw_entry", "/", 0,
319                 {"xyz.openbmc_project.HardwareIsolation.Entry"});
320             if (!hwIsolationAssocPaths.empty())
321             {
322                 return true;
323             }
324         }
325     }
326     return false;
327 }
328 
convertToPelFFDC(const FFDCEntries & ffdc)329 PelFFDC Manager::convertToPelFFDC(const FFDCEntries& ffdc)
330 {
331     PelFFDC pelFFDC;
332 
333     std::for_each(ffdc.begin(), ffdc.end(), [&pelFFDC](const auto& f) {
334         PelFFDCfile pf;
335         pf.subType = std::get<ffdcSubtypePos>(f);
336         pf.version = std::get<ffdcVersionPos>(f);
337         pf.fd = std::get<ffdcFDPos>(f);
338 
339         switch (std::get<ffdcFormatPos>(f))
340         {
341             case Create::FFDCFormat::JSON:
342                 pf.format = UserDataFormat::json;
343                 break;
344             case Create::FFDCFormat::CBOR:
345                 pf.format = UserDataFormat::cbor;
346                 break;
347             case Create::FFDCFormat::Text:
348                 pf.format = UserDataFormat::text;
349                 break;
350             case Create::FFDCFormat::Custom:
351                 pf.format = UserDataFormat::custom;
352                 break;
353         }
354 
355         pelFFDC.push_back(pf);
356     });
357 
358     return pelFFDC;
359 }
360 
createPEL(const std::string & message,uint32_t obmcLogID,uint64_t timestamp,phosphor::logging::Entry::Level severity,const std::map<std::string,std::string> & additionalData,const std::vector<std::string> &,const FFDCEntries & ffdc)361 void Manager::createPEL(
362     const std::string& message, uint32_t obmcLogID, uint64_t timestamp,
363     phosphor::logging::Entry::Level severity,
364     const std::map<std::string, std::string>& additionalData,
365     const std::vector<std::string>& /*associations*/, const FFDCEntries& ffdc)
366 {
367     auto entry = _registry.lookup(message, rg::LookupType::name);
368     auto pelFFDC = convertToPelFFDC(ffdc);
369     AdditionalData ad{additionalData};
370     std::string msg;
371 
372     if (!entry)
373     {
374         // Instead, get the default entry that means there is no
375         // other matching entry.  This error will still use the
376         // AdditionalData values of the original error, and this
377         // code will add the error message value that wasn't found
378         // to this AD.  This way, there will at least be a PEL,
379         // possibly with callouts, to allow users to debug the
380         // issue that caused the error even without its own PEL.
381         lg2::error("Event not found in PEL message registry: {MSG}", "MSG",
382                    message);
383 
384         entry = _registry.lookup(defaultLogMessage, rg::LookupType::name);
385         if (!entry)
386         {
387             lg2::error("Default event not found in PEL message registry");
388             return;
389         }
390 
391         ad.add(additional_data::error, message);
392     }
393 
394     auto pel = std::make_unique<openpower::pels::PEL>(
395         *entry, obmcLogID, timestamp, severity, ad, pelFFDC, *_dataIface,
396         *_journal);
397 
398     _repo.add(pel);
399 
400     if (_repo.sizeWarning())
401     {
402         scheduleRepoPrune();
403     }
404 
405     auto src = pel->primarySRC();
406     if (src)
407     {
408         auto asciiString = (*src)->asciiString();
409         while (asciiString.back() == ' ')
410         {
411             asciiString.pop_back();
412         }
413         lg2::info("Created PEL {ID} (BMC ID {BMCID}) with SRC {SRC}", "ID",
414                   lg2::hex, pel->id(), "BMCID", pel->obmcLogID(), "SRC",
415                   asciiString);
416     }
417 
418     // Check for severity 0x51 and update boot progress SRC
419     updateProgressSRC(pel);
420 
421     // Activate any resulting service indicators if necessary
422     auto policy = service_indicators::getPolicy(*_dataIface);
423     policy->activate(*pel);
424 
425     updateDBusSeverity(*pel);
426     updateEventId(pel);
427     updateResolution(*pel);
428     serializeLogEntry(obmcLogID);
429     createPELEntry(obmcLogID);
430 
431     // Check if firmware should quiesce system due to error
432     checkPelAndQuiesce(pel);
433 }
434 
getPEL(uint32_t pelID)435 sdbusplus::message::unix_fd Manager::getPEL(uint32_t pelID)
436 {
437     Repository::LogID id{Repository::LogID::Pel(pelID)};
438     std::optional<int> fd;
439 
440     lg2::debug("getPEL {ID}", "ID", lg2::hex, pelID);
441 
442     try
443     {
444         fd = _repo.getPELFD(id);
445     }
446     catch (const std::exception& e)
447     {
448         throw common_error::InternalFailure();
449     }
450 
451     if (!fd)
452     {
453         throw common_error::InvalidArgument();
454     }
455 
456     scheduleFDClose(*fd);
457 
458     return *fd;
459 }
460 
scheduleFDClose(int fd)461 void Manager::scheduleFDClose(int fd)
462 {
463     _fdCloserEventSource = std::make_unique<sdeventplus::source::Defer>(
464         _event, std::bind(std::mem_fn(&Manager::closeFD), this, fd,
465                           std::placeholders::_1));
466 }
467 
closeFD(int fd,sdeventplus::source::EventBase &)468 void Manager::closeFD(int fd, sdeventplus::source::EventBase& /*source*/)
469 {
470     close(fd);
471     _fdCloserEventSource.reset();
472 }
473 
getPELFromOBMCID(uint32_t obmcLogID)474 std::vector<uint8_t> Manager::getPELFromOBMCID(uint32_t obmcLogID)
475 {
476     Repository::LogID id{Repository::LogID::Obmc(obmcLogID)};
477     std::optional<std::vector<uint8_t>> data;
478 
479     lg2::debug("getPELFromOBMCID  {BMCID}", "BMCID", obmcLogID);
480 
481     try
482     {
483         data = _repo.getPELData(id);
484     }
485     catch (const std::exception& e)
486     {
487         throw common_error::InternalFailure();
488     }
489 
490     if (!data)
491     {
492         throw common_error::InvalidArgument();
493     }
494 
495     return *data;
496 }
497 
hostAck(uint32_t pelID)498 void Manager::hostAck(uint32_t pelID)
499 {
500     Repository::LogID id{Repository::LogID::Pel(pelID)};
501 
502     lg2::debug("HostHack {ID}", "ID", lg2::hex, pelID);
503 
504     if (!_repo.hasPEL(id))
505     {
506         throw common_error::InvalidArgument();
507     }
508 
509     if (_hostNotifier)
510     {
511         _hostNotifier->ackPEL(pelID);
512     }
513 }
514 
hostReject(uint32_t pelID,RejectionReason reason)515 void Manager::hostReject(uint32_t pelID, RejectionReason reason)
516 {
517     Repository::LogID id{Repository::LogID::Pel(pelID)};
518 
519     lg2::debug("HostReject {ID}, reason = {REASON}", "ID", lg2::hex, pelID,
520                "REASON", reason);
521 
522     if (!_repo.hasPEL(id))
523     {
524         throw common_error::InvalidArgument();
525     }
526 
527     if (reason == RejectionReason::BadPEL)
528     {
529         AdditionalData data;
530         data.add("BAD_ID", getNumberString("0x%08X", pelID));
531         _eventLogger.log("org.open_power.Logging.Error.SentBadPELToHost",
532                          Entry::Level::Informational, data);
533         if (_hostNotifier)
534         {
535             _hostNotifier->setBadPEL(pelID);
536         }
537     }
538     else if ((reason == RejectionReason::HostFull) && _hostNotifier)
539     {
540         _hostNotifier->setHostFull(pelID);
541     }
542 }
543 
scheduleRepoPrune()544 void Manager::scheduleRepoPrune()
545 {
546     _repoPrunerEventSource = std::make_unique<sdeventplus::source::Defer>(
547         _event, std::bind(std::mem_fn(&Manager::pruneRepo), this,
548                           std::placeholders::_1));
549 }
550 
pruneRepo(sdeventplus::source::EventBase &)551 void Manager::pruneRepo(sdeventplus::source::EventBase& /*source*/)
552 {
553     auto idsWithHwIsoEntry = _dataIface->getLogIDWithHwIsolation();
554 
555     auto idsToDelete = _repo.prune(idsWithHwIsoEntry);
556 
557     // Remove the OpenBMC event logs for the PELs that were just removed.
558     std::for_each(idsToDelete.begin(), idsToDelete.end(),
559                   [this](auto id) { this->_logManager.erase(id); });
560 
561     _repoPrunerEventSource.reset();
562 }
563 
setupPELDeleteWatch()564 void Manager::setupPELDeleteWatch()
565 {
566     _pelFileDeleteFD = inotify_init1(IN_NONBLOCK);
567     if (-1 == _pelFileDeleteFD)
568     {
569         auto e = errno;
570         lg2::error("inotify_init1 failed with errno {ERRNO}", "ERRNO", e);
571         abort();
572     }
573 
574     _pelFileDeleteWatchFD = inotify_add_watch(
575         _pelFileDeleteFD, _repo.repoPath().c_str(), IN_DELETE);
576     if (-1 == _pelFileDeleteWatchFD)
577     {
578         auto e = errno;
579         lg2::error("inotify_add_watch failed with errno {ERRNO}", "ERRNO", e);
580         abort();
581     }
582 
583     _pelFileDeleteEventSource = std::make_unique<sdeventplus::source::IO>(
584         _event, _pelFileDeleteFD, EPOLLIN,
585         std::bind(std::mem_fn(&Manager::pelFileDeleted), this,
586                   std::placeholders::_1, std::placeholders::_2,
587                   std::placeholders::_3));
588 }
589 
pelFileDeleted(sdeventplus::source::IO &,int,uint32_t revents)590 void Manager::pelFileDeleted(sdeventplus::source::IO& /*io*/, int /*fd*/,
591                              uint32_t revents)
592 {
593     if (!(revents & EPOLLIN))
594     {
595         return;
596     }
597 
598     // An event for 1 PEL uses 48B. When all PELs are deleted at once,
599     // as many events as there is room for can be handled in one callback.
600     // A size of 2000 will allow 41 to be processed, with additional
601     // callbacks being needed to process the remaining ones.
602     std::array<uint8_t, 2000> data{};
603     auto bytesRead = read(_pelFileDeleteFD, data.data(), data.size());
604     if (bytesRead < 0)
605     {
606         auto e = errno;
607         lg2::error("Failed reading data from inotify event, errno = {ERRNO}",
608                    "ERRNO", e);
609         abort();
610     }
611 
612     auto offset = 0;
613     while (offset < bytesRead)
614     {
615         auto event = reinterpret_cast<inotify_event*>(&data[offset]);
616         if (event->mask & IN_DELETE)
617         {
618             std::string filename{event->name};
619 
620             // Get the PEL ID from the filename and tell the
621             // repo it's been removed, and then delete the BMC
622             // event log if it's there.
623             auto pos = filename.find_first_of('_');
624             if (pos != std::string::npos)
625             {
626                 try
627                 {
628                     auto idString = filename.substr(pos + 1);
629                     auto pelID = std::stoul(idString, nullptr, 16);
630 
631                     Repository::LogID id{Repository::LogID::Pel(pelID)};
632                     auto removedLogID = _repo.remove(id);
633                     if (removedLogID)
634                     {
635                         _logManager.erase(removedLogID->obmcID.id);
636                     }
637                 }
638                 catch (const std::exception& e)
639                 {
640                     lg2::info("Could not find PEL ID from its filename {NAME}",
641                               "NAME", filename);
642                 }
643             }
644         }
645 
646         offset += offsetof(inotify_event, name) + event->len;
647     }
648 }
649 
createPELWithFFDCFiles(std::string message,Entry::Level severity,std::map<std::string,std::string> additionalData,std::vector<std::tuple<sdbusplus::server::xyz::openbmc_project::logging::Create::FFDCFormat,uint8_t,uint8_t,sdbusplus::message::unix_fd>> fFDC)650 std::tuple<uint32_t, uint32_t> Manager::createPELWithFFDCFiles(
651     std::string message, Entry::Level severity,
652     std::map<std::string, std::string> additionalData,
653     std::vector<std::tuple<
654         sdbusplus::server::xyz::openbmc_project::logging::Create::FFDCFormat,
655         uint8_t, uint8_t, sdbusplus::message::unix_fd>>
656         fFDC)
657 {
658     _logManager.create(message, severity, additionalData, fFDC);
659 
660     return {_logManager.lastEntryID(), _repo.lastPelID()};
661 }
662 
getPELJSON(uint32_t obmcLogID)663 std::string Manager::getPELJSON(uint32_t obmcLogID)
664 {
665     // Throws InvalidArgument if not found
666     auto pelID = getPELIdFromBMCLogId(obmcLogID);
667 
668     auto cmd = std::format("/usr/bin/peltool -i {:#x}", pelID);
669 
670     FILE* pipe = popen(cmd.c_str(), "r");
671     if (!pipe)
672     {
673         lg2::error("Error running cmd: {CMD}", "CMD", cmd);
674         throw common_error::InternalFailure();
675     }
676 
677     std::string output;
678     std::array<char, 1024> buffer;
679     while (fgets(buffer.data(), buffer.size(), pipe) != nullptr)
680     {
681         output.append(buffer.data());
682     }
683 
684     int rc = pclose(pipe);
685     if (WEXITSTATUS(rc) != 0)
686     {
687         lg2::error("Error running cmd: {CMD}, rc = {RC}", "CMD", cmd, "RC", rc);
688         throw common_error::InternalFailure();
689     }
690 
691     return output;
692 }
693 
checkPelAndQuiesce(std::unique_ptr<openpower::pels::PEL> & pel)694 void Manager::checkPelAndQuiesce(std::unique_ptr<openpower::pels::PEL>& pel)
695 {
696     if ((pel->userHeader().severity() ==
697          static_cast<uint8_t>(SeverityType::nonError)) ||
698         (pel->userHeader().severity() ==
699          static_cast<uint8_t>(SeverityType::recovered)))
700     {
701         lg2::debug(
702             "PEL severity informational or recovered. no quiesce needed");
703         return;
704     }
705     if (!_logManager.isQuiesceOnErrorEnabled())
706     {
707         lg2::debug("QuiesceOnHwError not enabled, no quiesce needed");
708         return;
709     }
710 
711     CreatorID creatorID{pel->privateHeader().creatorID()};
712 
713     if ((creatorID != CreatorID::openBMC) &&
714         (creatorID != CreatorID::hostboot) &&
715         (creatorID != CreatorID::ioDrawer) && (creatorID != CreatorID::occ) &&
716         (creatorID != CreatorID::phyp))
717     {
718         return;
719     }
720 
721     // Now check if it has any type of callout
722     if (pel->isHwCalloutPresent())
723     {
724         lg2::info(
725             "QuiesceOnHwError enabled, PEL severity not nonError or recovered, "
726             "and callout is present");
727 
728         _logManager.quiesceOnError(pel->obmcLogID());
729     }
730 }
731 
getEventId(const openpower::pels::PEL & pel) const732 std::string Manager::getEventId(const openpower::pels::PEL& pel) const
733 {
734     std::string str;
735     auto src = pel.primarySRC();
736     if (src)
737     {
738         const auto& hexwords = (*src)->hexwordData();
739 
740         std::string refcode = (*src)->asciiString();
741         size_t pos = refcode.find_last_not_of(0x20);
742         if (pos != std::string::npos)
743         {
744             refcode.erase(pos + 1);
745         }
746         str = refcode;
747 
748         for (auto& value : hexwords)
749         {
750             str += " ";
751             str += getNumberString("%08X", value);
752         }
753     }
754     return sanitizeFieldForDBus(str);
755 }
756 
updateEventId(std::unique_ptr<openpower::pels::PEL> & pel)757 void Manager::updateEventId(std::unique_ptr<openpower::pels::PEL>& pel)
758 {
759     std::string eventIdStr = getEventId(*pel);
760 
761     auto entryN = _logManager.entries.find(pel->obmcLogID());
762     if (entryN != _logManager.entries.end())
763     {
764         entryN->second->eventId(eventIdStr, true);
765     }
766 }
767 
sanitizeFieldForDBus(std::string field)768 std::string Manager::sanitizeFieldForDBus(std::string field)
769 {
770     std::for_each(field.begin(), field.end(), [](char& ch) {
771         if (((ch < ' ') || (ch > '~')) && (ch != '\n') && (ch != '\t'))
772         {
773             ch = ' ';
774         }
775     });
776     return field;
777 }
778 
getResolution(const openpower::pels::PEL & pel) const779 std::string Manager::getResolution(const openpower::pels::PEL& pel) const
780 {
781     std::string str;
782     std::string resolution;
783     auto src = pel.primarySRC();
784     if (src)
785     {
786         // First extract the callout pointer and then go through
787         const auto& callouts = (*src)->callouts();
788         namespace pv = openpower::pels::pel_values;
789         // All PELs dont have callout, check before parsing callout data
790         if (callouts)
791         {
792             const auto& entries = callouts->callouts();
793             // Entry starts with index 1
794             uint8_t index = 1;
795             for (auto& entry : entries)
796             {
797                 resolution += std::to_string(index) + ". ";
798                 // Adding Location code to resolution
799                 if (!entry->locationCode().empty())
800                     resolution += "Location Code: " + entry->locationCode() +
801                                   ", ";
802                 if (entry->fruIdentity())
803                 {
804                     // Get priority and set the resolution string
805                     str = pv::getValue(entry->priority(),
806                                        pel_values::calloutPriorityValues,
807                                        pel_values::registryNamePos);
808                     str[0] = toupper(str[0]);
809                     resolution += "Priority: " + str + ", ";
810                     if (entry->fruIdentity()->getPN().has_value())
811                     {
812                         resolution +=
813                             "PN: " + entry->fruIdentity()->getPN().value() +
814                             ", ";
815                     }
816                     if (entry->fruIdentity()->getSN().has_value())
817                     {
818                         resolution +=
819                             "SN: " + entry->fruIdentity()->getSN().value() +
820                             ", ";
821                     }
822                     if (entry->fruIdentity()->getCCIN().has_value())
823                     {
824                         resolution +=
825                             "CCIN: " + entry->fruIdentity()->getCCIN().value() +
826                             ", ";
827                     }
828                     // Add the maintenance procedure
829                     if (entry->fruIdentity()->getMaintProc().has_value())
830                     {
831                         resolution +=
832                             "Procedure: " +
833                             entry->fruIdentity()->getMaintProc().value() + ", ";
834                     }
835                 }
836                 resolution.resize(resolution.size() - 2);
837                 resolution += "\n";
838                 index++;
839             }
840         }
841     }
842     return sanitizeFieldForDBus(resolution);
843 }
844 
updateResolution(const openpower::pels::PEL & pel)845 bool Manager::updateResolution(const openpower::pels::PEL& pel)
846 {
847     std::string callouts = getResolution(pel);
848     auto entryN = _logManager.entries.find(pel.obmcLogID());
849     if (entryN != _logManager.entries.end())
850     {
851         entryN->second->resolution(callouts, true);
852     }
853 
854     return false;
855 }
856 
serializeLogEntry(uint32_t obmcLogID)857 void Manager::serializeLogEntry(uint32_t obmcLogID)
858 {
859     auto entryN = _logManager.entries.find(obmcLogID);
860     if (entryN != _logManager.entries.end())
861     {
862         serialize(*entryN->second);
863     }
864 }
865 
updateDBusSeverity(const openpower::pels::PEL & pel)866 void Manager::updateDBusSeverity(const openpower::pels::PEL& pel)
867 {
868     // The final severity of the PEL may not agree with the
869     // original severity of the D-Bus event log.  Update the
870     // D-Bus property to match in some cases.  This is to
871     // ensure there isn't a Critical or Warning Redfish event
872     // log for an informational or recovered PEL (or vice versa).
873     // This doesn't make an explicit call to serialize the new
874     // event log property value because updateEventId() is called
875     // right after this and will do it.
876     auto sevType =
877         static_cast<SeverityType>(pel.userHeader().severity() & 0xF0);
878 
879     auto entryN = _logManager.entries.find(pel.obmcLogID());
880     if (entryN != _logManager.entries.end())
881     {
882         auto newSeverity =
883             fixupLogSeverity(entryN->second->severity(), sevType);
884         if (newSeverity)
885         {
886             lg2::info("Changing event log {ID} severity from {OLD} "
887                       "to {NEW} to match PEL",
888                       "ID", lg2::hex, entryN->second->id(), "OLD",
889                       Entry::convertLevelToString(entryN->second->severity()),
890                       "NEW", Entry::convertLevelToString(*newSeverity));
891 
892             entryN->second->severity(*newSeverity, true);
893         }
894     }
895 }
896 
setEntryPath(uint32_t obmcLogID)897 void Manager::setEntryPath(uint32_t obmcLogID)
898 {
899     Repository::LogID id{Repository::LogID::Obmc(obmcLogID)};
900     if (auto attributes = _repo.getPELAttributes(id); attributes)
901     {
902         auto& attr = attributes.value().get();
903         auto entry = _logManager.entries.find(obmcLogID);
904         if (entry != _logManager.entries.end())
905         {
906             entry->second->path(attr.path, true);
907         }
908     }
909 }
910 
setServiceProviderNotifyFlag(uint32_t obmcLogID)911 void Manager::setServiceProviderNotifyFlag(uint32_t obmcLogID)
912 {
913     Repository::LogID id{Repository::LogID::Obmc(obmcLogID)};
914     if (auto attributes = _repo.getPELAttributes(id); attributes)
915     {
916         auto& attr = attributes.value().get();
917         auto entry = _logManager.entries.find(obmcLogID);
918         if (entry != _logManager.entries.end())
919         {
920             if (attr.actionFlags.test(callHomeFlagBit))
921             {
922                 entry->second->serviceProviderNotify(Entry::Notify::Notify,
923                                                      true);
924             }
925             else
926             {
927                 entry->second->serviceProviderNotify(Entry::Notify::Inhibit,
928                                                      true);
929             }
930         }
931     }
932 }
933 
createPELEntry(uint32_t obmcLogID,bool skipIaSignal)934 void Manager::createPELEntry(uint32_t obmcLogID, bool skipIaSignal)
935 {
936     std::map<std::string, PropertiesVariant> varData;
937     Repository::LogID id{Repository::LogID::Obmc(obmcLogID)};
938     if (auto attributes = _repo.getPELAttributes(id); attributes)
939     {
940         namespace pv = openpower::pels::pel_values;
941         auto& attr = attributes.value().get();
942 
943         // get the hidden flag values
944         auto sevType = static_cast<SeverityType>(attr.severity & 0xF0);
945         auto isHidden = true;
946         if (((sevType != SeverityType::nonError) &&
947              attr.actionFlags.test(reportFlagBit) &&
948              !attr.actionFlags.test(hiddenFlagBit)) ||
949             ((sevType == SeverityType::nonError) &&
950              attr.actionFlags.test(serviceActionFlagBit)))
951         {
952             isHidden = false;
953         }
954         varData.emplace(std::string("Hidden"), isHidden);
955         varData.emplace(
956             std::string("Subsystem"),
957             pv::getValue(attr.subsystem, pel_values::subsystemValues));
958 
959         varData.emplace(
960             std::string("ManagementSystemAck"),
961             (attr.hmcState == TransmissionState::acked ? true : false));
962 
963         varData.emplace("PlatformLogID", attr.plid);
964         varData.emplace("Deconfig", attr.deconfig);
965         varData.emplace("Guard", attr.guard);
966         varData.emplace("Timestamp", attr.creationTime);
967 
968         // Path to create PELEntry Interface is same as PEL
969         auto path = std::string(OBJ_ENTRY) + '/' + std::to_string(obmcLogID);
970         // Create Interface for PELEntry and set properties
971         auto pelEntry = std::make_unique<PELEntry>(_logManager.getBus(), path,
972                                                    varData, obmcLogID, &_repo);
973         if (!skipIaSignal)
974         {
975             pelEntry->emit_added();
976         }
977         _pelEntries.emplace(std::move(path), std::move(pelEntry));
978     }
979 }
980 
getPELIdFromBMCLogId(uint32_t bmcLogId)981 uint32_t Manager::getPELIdFromBMCLogId(uint32_t bmcLogId)
982 {
983     Repository::LogID id{Repository::LogID::Obmc(bmcLogId)};
984     if (auto logId = _repo.getLogID(id); !logId.has_value())
985     {
986         throw common_error::InvalidArgument();
987     }
988     else
989     {
990         return logId->pelID.id;
991     }
992 }
993 
getBMCLogIdFromPELId(uint32_t pelId)994 uint32_t Manager::getBMCLogIdFromPELId(uint32_t pelId)
995 {
996     Repository::LogID id{Repository::LogID::Pel(pelId)};
997     if (auto logId = _repo.getLogID(id); !logId.has_value())
998     {
999         throw common_error::InvalidArgument();
1000     }
1001     else
1002     {
1003         return logId->obmcID.id;
1004     }
1005 }
1006 
1007 void
updateProgressSRC(std::unique_ptr<openpower::pels::PEL> & pel) const1008     Manager::updateProgressSRC(std::unique_ptr<openpower::pels::PEL>& pel) const
1009 {
1010     // Check for pel severity of type - 0x51 = critical error, system
1011     // termination
1012     if (pel->userHeader().severity() == 0x51)
1013     {
1014         auto src = pel->primarySRC();
1015         if (src)
1016         {
1017             std::vector<uint8_t> asciiSRC = (*src)->getSrcStruct();
1018             uint64_t srcRefCode = 0;
1019 
1020             // Read bytes from offset [40-47] e.g. BD8D1001
1021             for (int i = 0; i < 8; i++)
1022             {
1023                 srcRefCode |=
1024                     (static_cast<uint64_t>(asciiSRC[40 + i]) << (8 * i));
1025             }
1026 
1027             try
1028             {
1029                 _dataIface->createProgressSRC(srcRefCode, asciiSRC);
1030             }
1031             catch (const std::exception&)
1032             {
1033                 // Exception - may be no boot progress interface on dbus
1034             }
1035         }
1036     }
1037 }
1038 
scheduleObmcLogDelete(uint32_t obmcLogID)1039 void Manager::scheduleObmcLogDelete(uint32_t obmcLogID)
1040 {
1041     _obmcLogDeleteEventSource = std::make_unique<sdeventplus::source::Defer>(
1042         _event, std::bind(std::mem_fn(&Manager::deleteObmcLog), this,
1043                           std::placeholders::_1, obmcLogID));
1044 }
1045 
deleteObmcLog(sdeventplus::source::EventBase &,uint32_t obmcLogID)1046 void Manager::deleteObmcLog(sdeventplus::source::EventBase&, uint32_t obmcLogID)
1047 {
1048     lg2::info("Removing event log with no PEL: {BMCID}", "BMCID", obmcLogID);
1049     _logManager.erase(obmcLogID);
1050     _obmcLogDeleteEventSource.reset();
1051 }
1052 
clearPowerThermalDeconfigFlag(const std::string & locationCode,openpower::pels::PEL & pel)1053 bool Manager::clearPowerThermalDeconfigFlag(const std::string& locationCode,
1054                                             openpower::pels::PEL& pel)
1055 {
1056     // The requirements state that only power-thermal or
1057     // fan PELs need their deconfig flag cleared.
1058     static const std::vector<uint32_t> compIDs{bmcThermalCompID, bmcFansCompID};
1059 
1060     if (std::find(compIDs.begin(), compIDs.end(),
1061                   pel.privateHeader().header().componentID) == compIDs.end())
1062     {
1063         return false;
1064     }
1065 
1066     auto src = pel.primarySRC();
1067     const auto& callouts = (*src)->callouts();
1068     if (!callouts)
1069     {
1070         return false;
1071     }
1072 
1073     for (const auto& callout : callouts->callouts())
1074     {
1075         // Look for the passed in location code in a callout that
1076         // is either a normal HW callout or a symbolic FRU with
1077         // a trusted location code callout.
1078         if ((callout->locationCode() != locationCode) ||
1079             !callout->fruIdentity())
1080         {
1081             continue;
1082         }
1083 
1084         if ((callout->fruIdentity()->failingComponentType() !=
1085              src::FRUIdentity::hardwareFRU) &&
1086             (callout->fruIdentity()->failingComponentType() !=
1087              src::FRUIdentity::symbolicFRUTrustedLocCode))
1088         {
1089             continue;
1090         }
1091 
1092         lg2::info(
1093             "Clearing deconfig flag in PEL {ID} with SRC {SRC} because {LOC} was replaced",
1094             "ID", lg2::hex, pel.id(), "SRC", (*src)->asciiString().substr(0, 8),
1095             "LOC", locationCode);
1096         (*src)->clearErrorStatusFlag(SRC::ErrorStatusFlags::deconfigured);
1097         return true;
1098     }
1099     return false;
1100 }
1101 
hardwarePresent(const std::string & locationCode)1102 void Manager::hardwarePresent(const std::string& locationCode)
1103 {
1104     Repository::PELUpdateFunc handlePowerThermalHardwarePresent =
1105         [locationCode](openpower::pels::PEL& pel) {
1106             return Manager::clearPowerThermalDeconfigFlag(locationCode, pel);
1107         };
1108 
1109     // If the PEL was created by the BMC and has the deconfig flag set,
1110     // it's a candidate to have the deconfig flag cleared.
1111     for (const auto& [id, attributes] : _repo.getAttributesMap())
1112     {
1113         if ((attributes.creator == static_cast<uint8_t>(CreatorID::openBMC)) &&
1114             attributes.deconfig)
1115         {
1116             auto updated = _repo.updatePEL(attributes.path,
1117                                            handlePowerThermalHardwarePresent);
1118 
1119             if (updated)
1120             {
1121                 // Also update the property on D-Bus
1122                 auto objPath = std::string(OBJ_ENTRY) + '/' +
1123                                std::to_string(id.obmcID.id);
1124                 auto entryN = _pelEntries.find(objPath);
1125                 if (entryN != _pelEntries.end())
1126                 {
1127                     entryN->second->deconfig(false);
1128                 }
1129                 else
1130                 {
1131                     lg2::error(
1132                         "Could not find PEL Entry D-Bus object for {PATH}",
1133                         "PATH", objPath);
1134                 }
1135             }
1136         }
1137     }
1138 }
1139 
1140 } // namespace pels
1141 } // namespace openpower
1142