xref: /openbmc/phosphor-logging/extensions/openpower-pels/manager.cpp (revision 760b98178edb7039dd48904a8d2ade5dbea37ef8)
1 /**
2  * Copyright © 2019 IBM Corporation
3  *
4  * Licensed under the Apache License, Version 2.0 (the "License");
5  * you may not use this file except in compliance with the License.
6  * You may obtain a copy of the License at
7  *
8  *     http://www.apache.org/licenses/LICENSE-2.0
9  *
10  * Unless required by applicable law or agreed to in writing, software
11  * distributed under the License is distributed on an "AS IS" BASIS,
12  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13  * See the License for the specific language governing permissions and
14  * limitations under the License.
15  */
16 #include "manager.hpp"
17 
18 #include "additional_data.hpp"
19 #include "elog_serialize.hpp"
20 #include "json_utils.hpp"
21 #include "pel.hpp"
22 #include "pel_entry.hpp"
23 #include "service_indicators.hpp"
24 #include "severity.hpp"
25 
26 #include <sys/inotify.h>
27 #include <unistd.h>
28 
29 #include <phosphor-logging/lg2.hpp>
30 #include <xyz/openbmc_project/Common/error.hpp>
31 #include <xyz/openbmc_project/Logging/Create/server.hpp>
32 
33 #include <filesystem>
34 #include <format>
35 #include <fstream>
36 #include <locale>
37 
38 namespace openpower
39 {
40 namespace pels
41 {
42 
43 using namespace phosphor::logging;
44 namespace fs = std::filesystem;
45 namespace rg = openpower::pels::message;
46 
47 namespace common_error = sdbusplus::xyz::openbmc_project::Common::Error;
48 
49 using Create = sdbusplus::server::xyz::openbmc_project::logging::Create;
50 
51 namespace additional_data
52 {
53 constexpr auto rawPEL = "RAWPEL";
54 constexpr auto esel = "ESEL";
55 constexpr auto error = "ERROR_NAME";
56 } // namespace additional_data
57 
58 constexpr auto defaultLogMessage = "xyz.openbmc_project.Logging.Error.Default";
59 constexpr uint32_t bmcThermalCompID = 0x2700;
60 constexpr uint32_t bmcFansCompID = 0x2800;
61 
~Manager()62 Manager::~Manager()
63 {
64     if (_pelFileDeleteFD != -1)
65     {
66         if (_pelFileDeleteWatchFD != -1)
67         {
68             inotify_rm_watch(_pelFileDeleteFD, _pelFileDeleteWatchFD);
69         }
70         close(_pelFileDeleteFD);
71     }
72 }
73 
create(const std::string & message,uint32_t obmcLogID,uint64_t timestamp,Entry::Level severity,const std::map<std::string,std::string> & additionalData,const std::vector<std::string> & associations,const FFDCEntries & ffdc)74 void Manager::create(const std::string& message, uint32_t obmcLogID,
75                      uint64_t timestamp, Entry::Level severity,
76                      const std::map<std::string, std::string>& additionalData,
77                      const std::vector<std::string>& associations,
78                      const FFDCEntries& ffdc)
79 {
80     AdditionalData ad{additionalData};
81 
82     // If a PEL was passed in via a filename or in an ESEL,
83     // use that.  Otherwise, create one.
84     auto rawPelPath = ad.getValue(additional_data::rawPEL);
85     if (rawPelPath)
86     {
87         addRawPEL(*rawPelPath, obmcLogID);
88     }
89     else
90     {
91         auto esel = ad.getValue(additional_data::esel);
92         if (esel)
93         {
94             addESELPEL(*esel, obmcLogID);
95         }
96         else
97         {
98             createPEL(message, obmcLogID, timestamp, severity, additionalData,
99                       associations, ffdc);
100         }
101     }
102 
103     setEntryPath(obmcLogID);
104     setServiceProviderNotifyFlag(obmcLogID);
105 }
106 
addRawPEL(const std::string & rawPelPath,uint32_t obmcLogID)107 void Manager::addRawPEL(const std::string& rawPelPath, uint32_t obmcLogID)
108 {
109     if (fs::exists(rawPelPath))
110     {
111         std::ifstream file(rawPelPath, std::ios::in | std::ios::binary);
112 
113         auto data = std::vector<uint8_t>(std::istreambuf_iterator<char>(file),
114                                          std::istreambuf_iterator<char>());
115         if (file.fail())
116         {
117             lg2::error(
118                 "Filesystem error reading a raw PEL. File = {FILE}, obmcLogID = {LOGID}",
119                 "FILE", rawPelPath, "LOGID", obmcLogID);
120             // TODO, Decide what to do here. Maybe nothing.
121             return;
122         }
123 
124         file.close();
125 
126         addPEL(data, obmcLogID);
127 
128         std::error_code ec;
129         fs::remove(rawPelPath, ec);
130     }
131     else
132     {
133         lg2::error(
134             "Raw PEL file from BMC event log does not exit. File = {FILE}, obmcLogID = {LOGID}",
135             "FILE", rawPelPath, "LOGID", obmcLogID);
136     }
137 }
138 
addPEL(std::vector<uint8_t> & pelData,uint32_t obmcLogID)139 void Manager::addPEL(std::vector<uint8_t>& pelData, uint32_t obmcLogID)
140 {
141     auto pel = std::make_unique<openpower::pels::PEL>(pelData, obmcLogID);
142     if (pel->valid())
143     {
144         // PELs created by others still need this field set by us.
145         pel->setCommitTime();
146 
147         // Assign Id other than to Hostbot PEL
148         if ((pel->privateHeader()).creatorID() !=
149             static_cast<uint8_t>(CreatorID::hostboot))
150         {
151             pel->assignID();
152         }
153         else
154         {
155             const Repository::LogID id{Repository::LogID::Pel(pel->id())};
156             auto result = _repo.hasPEL(id);
157             if (result)
158             {
159                 lg2::warning(
160                     "Duplicate HostBoot PEL ID {ID} found, moving it to archive folder",
161                     "ID", lg2::hex, pel->id());
162 
163                 _repo.archivePEL(*pel);
164 
165                 // No need to keep around the openBMC event log entry
166                 scheduleObmcLogDelete(obmcLogID);
167                 return;
168             }
169         }
170 
171         // Update System Info to Extended User Data
172         pel->updateSysInfoInExtendedUserDataSection(*_dataIface);
173 
174         // Check for severity 0x51 and update boot progress SRC
175         updateProgressSRC(pel);
176 
177         try
178         {
179             lg2::debug("Adding external PEL {ID} (BMC ID {BMCID}) to repo",
180                        "ID", lg2::hex, pel->id(), "BMCID", obmcLogID);
181             _repo.add(pel);
182 
183             if (_repo.sizeWarning())
184             {
185                 scheduleRepoPrune();
186             }
187 
188             // Activate any resulting service indicators if necessary
189             auto policy = service_indicators::getPolicy(*_dataIface);
190             policy->activate(*pel);
191         }
192         catch (const std::exception& e)
193         {
194             // Probably a full or r/o filesystem, not much we can do.
195             lg2::error("Unable to add PEL {ID} to Repository", "ID", lg2::hex,
196                        pel->id());
197         }
198 
199         updateEventId(pel);
200         updateResolution(*pel);
201         serializeLogEntry(obmcLogID);
202         createPELEntry(obmcLogID);
203 
204         // Check if firmware should quiesce system due to error
205         checkPelAndQuiesce(pel);
206     }
207     else
208     {
209         lg2::error("Invalid PEL received from the host. BMC ID = {ID}", "ID",
210                    obmcLogID);
211 
212         AdditionalData ad;
213         ad.add("PLID", getNumberString("0x%08X", pel->plid()));
214         ad.add("OBMC_LOG_ID", std::to_string(obmcLogID));
215         ad.add("PEL_SIZE", std::to_string(pelData.size()));
216 
217         std::string asciiString;
218         auto src = pel->primarySRC();
219         if (src)
220         {
221             asciiString = (*src)->asciiString();
222         }
223 
224         ad.add("SRC", asciiString);
225 
226         _eventLogger.log("org.open_power.Logging.Error.BadHostPEL",
227                          Entry::Level::Error, ad);
228 
229         // Save it to a file for debug in the lab.  Just keep the latest.
230         // Not adding it to the PEL because it could already be max size
231         // and don't want to truncate an already invalid PEL.
232         std::ofstream pelFile{getPELRepoPath() / "badPEL"};
233         pelFile.write(reinterpret_cast<const char*>(pelData.data()),
234                       pelData.size());
235 
236         // No need to keep around the openBMC event log entry
237         scheduleObmcLogDelete(obmcLogID);
238     }
239 }
240 
addESELPEL(const std::string & esel,uint32_t obmcLogID)241 void Manager::addESELPEL(const std::string& esel, uint32_t obmcLogID)
242 {
243     std::vector<uint8_t> data;
244 
245     lg2::debug("Adding PEL from ESEL. BMC ID = {ID}", "ID", obmcLogID);
246 
247     try
248     {
249         data = std::move(eselToRawData(esel));
250     }
251     catch (const std::exception& e)
252     {
253         // Try to add it below anyway, so it follows the usual bad data path.
254         lg2::error("Problems converting ESEL string to a byte vector");
255     }
256 
257     addPEL(data, obmcLogID);
258 }
259 
eselToRawData(const std::string & esel)260 std::vector<uint8_t> Manager::eselToRawData(const std::string& esel)
261 {
262     std::vector<uint8_t> data;
263     std::string byteString;
264 
265     // As the eSEL string looks like: "50 48 00 ab ..." there are 3
266     // characters per raw byte, and since the actual PEL data starts
267     // at the 16th byte, the code will grab the PEL data starting at
268     // offset 48 in the string.
269     static constexpr size_t pelStart = 16 * 3;
270 
271     if (esel.size() <= pelStart)
272     {
273         lg2::error("ESEL data too short, length = {LEN}", "LEN", esel.size());
274         throw std::length_error("ESEL data too short");
275     }
276 
277     for (size_t i = pelStart; i < esel.size(); i += 3)
278     {
279         if (i + 1 < esel.size())
280         {
281             byteString = esel.substr(i, 2);
282             data.push_back(std::stoi(byteString, nullptr, 16));
283         }
284         else
285         {
286             lg2::error("ESEL data too short, length = {LEN}", "LEN",
287                        esel.size());
288             throw std::length_error("ESEL data too short");
289         }
290     }
291 
292     return data;
293 }
294 
erase(uint32_t obmcLogID)295 void Manager::erase(uint32_t obmcLogID)
296 {
297     Repository::LogID id{Repository::LogID::Obmc(obmcLogID)};
298 
299     auto path = std::string(OBJ_ENTRY) + '/' + std::to_string(obmcLogID);
300     _pelEntries.erase(path);
301     _repo.remove(id);
302 }
303 
getLogIDWithHwIsolation(std::vector<uint32_t> & idsWithHwIsoEntry)304 void Manager::getLogIDWithHwIsolation(std::vector<uint32_t>& idsWithHwIsoEntry)
305 {
306     idsWithHwIsoEntry = _dataIface->getLogIDWithHwIsolation();
307 }
308 
isDeleteProhibited(uint32_t obmcLogID)309 bool Manager::isDeleteProhibited(uint32_t obmcLogID)
310 {
311     Repository::LogID id{Repository::LogID::Obmc(obmcLogID)};
312     if (!_repo.hasPEL(id))
313     {
314         return false;
315     }
316     auto entryPath{std::string(OBJ_ENTRY) + '/' + std::to_string(obmcLogID)};
317     auto entry = _pelEntries.find(entryPath);
318     if (entry != _pelEntries.end())
319     {
320         if (entry->second->guard())
321         {
322             auto hwIsolationAssocPaths = _dataIface->getAssociatedPaths(
323                 entryPath += "/isolated_hw_entry", "/", 0,
324                 {"xyz.openbmc_project.HardwareIsolation.Entry"});
325             if (!hwIsolationAssocPaths.empty())
326             {
327                 return true;
328             }
329         }
330     }
331     return false;
332 }
333 
convertToPelFFDC(const FFDCEntries & ffdc)334 PelFFDC Manager::convertToPelFFDC(const FFDCEntries& ffdc)
335 {
336     PelFFDC pelFFDC;
337 
338     std::for_each(ffdc.begin(), ffdc.end(), [&pelFFDC](const auto& f) {
339         PelFFDCfile pf;
340         pf.subType = std::get<ffdcSubtypePos>(f);
341         pf.version = std::get<ffdcVersionPos>(f);
342         pf.fd = std::get<ffdcFDPos>(f);
343 
344         switch (std::get<ffdcFormatPos>(f))
345         {
346             case Create::FFDCFormat::JSON:
347                 pf.format = UserDataFormat::json;
348                 break;
349             case Create::FFDCFormat::CBOR:
350                 pf.format = UserDataFormat::cbor;
351                 break;
352             case Create::FFDCFormat::Text:
353                 pf.format = UserDataFormat::text;
354                 break;
355             case Create::FFDCFormat::Custom:
356                 pf.format = UserDataFormat::custom;
357                 break;
358         }
359 
360         pelFFDC.push_back(pf);
361     });
362 
363     return pelFFDC;
364 }
365 
createPEL(const std::string & message,uint32_t obmcLogID,uint64_t timestamp,phosphor::logging::Entry::Level severity,const std::map<std::string,std::string> & additionalData,const std::vector<std::string> &,const FFDCEntries & ffdc)366 void Manager::createPEL(
367     const std::string& message, uint32_t obmcLogID, uint64_t timestamp,
368     phosphor::logging::Entry::Level severity,
369     const std::map<std::string, std::string>& additionalData,
370     const std::vector<std::string>& /*associations*/, const FFDCEntries& ffdc)
371 {
372     auto entry = _registry.lookup(message, rg::LookupType::name);
373     auto pelFFDC = convertToPelFFDC(ffdc);
374     AdditionalData ad{additionalData};
375     std::string msg;
376 
377     if (!entry)
378     {
379         // Instead, get the default entry that means there is no
380         // other matching entry.  This error will still use the
381         // AdditionalData values of the original error, and this
382         // code will add the error message value that wasn't found
383         // to this AD.  This way, there will at least be a PEL,
384         // possibly with callouts, to allow users to debug the
385         // issue that caused the error even without its own PEL.
386         lg2::error("Event not found in PEL message registry: {MSG}", "MSG",
387                    message);
388 
389         entry = _registry.lookup(defaultLogMessage, rg::LookupType::name);
390         if (!entry)
391         {
392             lg2::error("Default event not found in PEL message registry");
393             return;
394         }
395 
396         ad.add(additional_data::error, message);
397     }
398 
399     auto pel = std::make_unique<openpower::pels::PEL>(
400         *entry, obmcLogID, timestamp, severity, ad, pelFFDC, *_dataIface,
401         *_journal);
402 
403     _repo.add(pel);
404 
405     if (_repo.sizeWarning())
406     {
407         scheduleRepoPrune();
408     }
409 
410     auto src = pel->primarySRC();
411     if (src)
412     {
413         auto asciiString = (*src)->asciiString();
414         while (asciiString.back() == ' ')
415         {
416             asciiString.pop_back();
417         }
418         lg2::info("Created PEL {ID} (BMC ID {BMCID}) with SRC {SRC}", "ID",
419                   lg2::hex, pel->id(), "BMCID", pel->obmcLogID(), "SRC",
420                   asciiString);
421     }
422 
423     // Check for severity 0x51 and update boot progress SRC
424     updateProgressSRC(pel);
425 
426     // Activate any resulting service indicators if necessary
427     auto policy = service_indicators::getPolicy(*_dataIface);
428     policy->activate(*pel);
429 
430     updateDBusSeverity(*pel);
431     updateEventId(pel);
432     updateResolution(*pel);
433     serializeLogEntry(obmcLogID);
434     createPELEntry(obmcLogID);
435 
436     // Check if firmware should quiesce system due to error
437     checkPelAndQuiesce(pel);
438 }
439 
getPEL(uint32_t pelID)440 sdbusplus::message::unix_fd Manager::getPEL(uint32_t pelID)
441 {
442     Repository::LogID id{Repository::LogID::Pel(pelID)};
443     std::optional<int> fd;
444 
445     lg2::debug("getPEL {ID}", "ID", lg2::hex, pelID);
446 
447     try
448     {
449         fd = _repo.getPELFD(id);
450     }
451     catch (const std::exception& e)
452     {
453         throw common_error::InternalFailure();
454     }
455 
456     if (!fd)
457     {
458         throw common_error::InvalidArgument();
459     }
460 
461     scheduleFDClose(*fd);
462 
463     return *fd;
464 }
465 
scheduleFDClose(int fd)466 void Manager::scheduleFDClose(int fd)
467 {
468     _fdCloserEventSource = std::make_unique<sdeventplus::source::Defer>(
469         _event, std::bind(std::mem_fn(&Manager::closeFD), this, fd,
470                           std::placeholders::_1));
471 }
472 
closeFD(int fd,sdeventplus::source::EventBase &)473 void Manager::closeFD(int fd, sdeventplus::source::EventBase& /*source*/)
474 {
475     close(fd);
476     _fdCloserEventSource.reset();
477 }
478 
getPELFromOBMCID(uint32_t obmcLogID)479 std::vector<uint8_t> Manager::getPELFromOBMCID(uint32_t obmcLogID)
480 {
481     Repository::LogID id{Repository::LogID::Obmc(obmcLogID)};
482     std::optional<std::vector<uint8_t>> data;
483 
484     lg2::debug("getPELFromOBMCID  {BMCID}", "BMCID", obmcLogID);
485 
486     try
487     {
488         data = _repo.getPELData(id);
489     }
490     catch (const std::exception& e)
491     {
492         throw common_error::InternalFailure();
493     }
494 
495     if (!data)
496     {
497         throw common_error::InvalidArgument();
498     }
499 
500     return *data;
501 }
502 
hostAck(uint32_t pelID)503 void Manager::hostAck(uint32_t pelID)
504 {
505     Repository::LogID id{Repository::LogID::Pel(pelID)};
506 
507     lg2::debug("HostHack {ID}", "ID", lg2::hex, pelID);
508 
509     if (!_repo.hasPEL(id))
510     {
511         throw common_error::InvalidArgument();
512     }
513 
514     if (_hostNotifier)
515     {
516         _hostNotifier->ackPEL(pelID);
517     }
518 }
519 
hostReject(uint32_t pelID,RejectionReason reason)520 void Manager::hostReject(uint32_t pelID, RejectionReason reason)
521 {
522     Repository::LogID id{Repository::LogID::Pel(pelID)};
523 
524     lg2::debug("HostReject {ID}, reason = {REASON}", "ID", lg2::hex, pelID,
525                "REASON", reason);
526 
527     if (!_repo.hasPEL(id))
528     {
529         throw common_error::InvalidArgument();
530     }
531 
532     if (reason == RejectionReason::BadPEL)
533     {
534         AdditionalData data;
535         data.add("BAD_ID", getNumberString("0x%08X", pelID));
536         _eventLogger.log("org.open_power.Logging.Error.SentBadPELToHost",
537                          Entry::Level::Informational, data);
538         if (_hostNotifier)
539         {
540             _hostNotifier->setBadPEL(pelID);
541         }
542     }
543     else if ((reason == RejectionReason::HostFull) && _hostNotifier)
544     {
545         _hostNotifier->setHostFull(pelID);
546     }
547 }
548 
scheduleRepoPrune()549 void Manager::scheduleRepoPrune()
550 {
551     _repoPrunerEventSource = std::make_unique<sdeventplus::source::Defer>(
552         _event, std::bind(std::mem_fn(&Manager::pruneRepo), this,
553                           std::placeholders::_1));
554 }
555 
pruneRepo(sdeventplus::source::EventBase &)556 void Manager::pruneRepo(sdeventplus::source::EventBase& /*source*/)
557 {
558     auto idsWithHwIsoEntry = _dataIface->getLogIDWithHwIsolation();
559 
560     auto idsToDelete = _repo.prune(idsWithHwIsoEntry);
561 
562     // Remove the OpenBMC event logs for the PELs that were just removed.
563     std::for_each(idsToDelete.begin(), idsToDelete.end(),
564                   [this](auto id) { this->_logManager.erase(id); });
565 
566     _repoPrunerEventSource.reset();
567 }
568 
setupPELDeleteWatch()569 void Manager::setupPELDeleteWatch()
570 {
571     _pelFileDeleteFD = inotify_init1(IN_NONBLOCK);
572     if (-1 == _pelFileDeleteFD)
573     {
574         auto e = errno;
575         lg2::error("inotify_init1 failed with errno {ERRNO}", "ERRNO", e);
576         abort();
577     }
578 
579     _pelFileDeleteWatchFD = inotify_add_watch(
580         _pelFileDeleteFD, _repo.repoPath().c_str(), IN_DELETE);
581     if (-1 == _pelFileDeleteWatchFD)
582     {
583         auto e = errno;
584         lg2::error("inotify_add_watch failed with errno {ERRNO}", "ERRNO", e);
585         abort();
586     }
587 
588     _pelFileDeleteEventSource = std::make_unique<sdeventplus::source::IO>(
589         _event, _pelFileDeleteFD, EPOLLIN,
590         std::bind(std::mem_fn(&Manager::pelFileDeleted), this,
591                   std::placeholders::_1, std::placeholders::_2,
592                   std::placeholders::_3));
593 }
594 
pelFileDeleted(sdeventplus::source::IO &,int,uint32_t revents)595 void Manager::pelFileDeleted(sdeventplus::source::IO& /*io*/, int /*fd*/,
596                              uint32_t revents)
597 {
598     if (!(revents & EPOLLIN))
599     {
600         return;
601     }
602 
603     // An event for 1 PEL uses 48B. When all PELs are deleted at once,
604     // as many events as there is room for can be handled in one callback.
605     // A size of 2000 will allow 41 to be processed, with additional
606     // callbacks being needed to process the remaining ones.
607     std::array<uint8_t, 2000> data{};
608     auto bytesRead = read(_pelFileDeleteFD, data.data(), data.size());
609     if (bytesRead < 0)
610     {
611         auto e = errno;
612         lg2::error("Failed reading data from inotify event, errno = {ERRNO}",
613                    "ERRNO", e);
614         abort();
615     }
616 
617     auto offset = 0;
618     while (offset < bytesRead)
619     {
620         auto event = reinterpret_cast<inotify_event*>(&data[offset]);
621         if (event->mask & IN_DELETE)
622         {
623             std::string filename{event->name};
624 
625             // Get the PEL ID from the filename and tell the
626             // repo it's been removed, and then delete the BMC
627             // event log if it's there.
628             auto pos = filename.find_first_of('_');
629             if (pos != std::string::npos)
630             {
631                 try
632                 {
633                     auto idString = filename.substr(pos + 1);
634                     auto pelID = std::stoul(idString, nullptr, 16);
635 
636                     Repository::LogID id{Repository::LogID::Pel(pelID)};
637                     auto removedLogID = _repo.remove(id);
638                     if (removedLogID)
639                     {
640                         _logManager.erase(removedLogID->obmcID.id);
641                     }
642                 }
643                 catch (const std::exception& e)
644                 {
645                     lg2::info("Could not find PEL ID from its filename {NAME}",
646                               "NAME", filename);
647                 }
648             }
649         }
650 
651         offset += offsetof(inotify_event, name) + event->len;
652     }
653 }
654 
createPELWithFFDCFiles(std::string message,Entry::Level severity,std::map<std::string,std::string> additionalData,std::vector<std::tuple<sdbusplus::server::xyz::openbmc_project::logging::Create::FFDCFormat,uint8_t,uint8_t,sdbusplus::message::unix_fd>> fFDC)655 std::tuple<uint32_t, uint32_t> Manager::createPELWithFFDCFiles(
656     std::string message, Entry::Level severity,
657     std::map<std::string, std::string> additionalData,
658     std::vector<std::tuple<
659         sdbusplus::server::xyz::openbmc_project::logging::Create::FFDCFormat,
660         uint8_t, uint8_t, sdbusplus::message::unix_fd>>
661         fFDC)
662 {
663     _logManager.create(message, severity, additionalData, fFDC);
664 
665     return {_logManager.lastEntryID(), _repo.lastPelID()};
666 }
667 
getPELJSON(uint32_t obmcLogID)668 std::string Manager::getPELJSON(uint32_t obmcLogID)
669 {
670     // Throws InvalidArgument if not found
671     auto pelID = getPELIdFromBMCLogId(obmcLogID);
672 
673     auto cmd = std::format("/usr/bin/peltool -i {:#x}", pelID);
674 
675     FILE* pipe = popen(cmd.c_str(), "r");
676     if (!pipe)
677     {
678         lg2::error("Error running cmd: {CMD}", "CMD", cmd);
679         throw common_error::InternalFailure();
680     }
681 
682     std::string output;
683     std::array<char, 1024> buffer;
684     while (fgets(buffer.data(), buffer.size(), pipe) != nullptr)
685     {
686         output.append(buffer.data());
687     }
688 
689     int rc = pclose(pipe);
690     if (WEXITSTATUS(rc) != 0)
691     {
692         lg2::error("Error running cmd: {CMD}, rc = {RC}", "CMD", cmd, "RC", rc);
693         throw common_error::InternalFailure();
694     }
695 
696     return output;
697 }
698 
checkPelAndQuiesce(std::unique_ptr<openpower::pels::PEL> & pel)699 void Manager::checkPelAndQuiesce(std::unique_ptr<openpower::pels::PEL>& pel)
700 {
701     if ((pel->userHeader().severity() ==
702          static_cast<uint8_t>(SeverityType::nonError)) ||
703         (pel->userHeader().severity() ==
704          static_cast<uint8_t>(SeverityType::recovered)))
705     {
706         lg2::debug(
707             "PEL severity informational or recovered. no quiesce needed");
708         return;
709     }
710     if (!_logManager.isQuiesceOnErrorEnabled())
711     {
712         lg2::debug("QuiesceOnHwError not enabled, no quiesce needed");
713         return;
714     }
715 
716     CreatorID creatorID{pel->privateHeader().creatorID()};
717 
718     if ((creatorID != CreatorID::openBMC) &&
719         (creatorID != CreatorID::hostboot) &&
720         (creatorID != CreatorID::ioDrawer) && (creatorID != CreatorID::occ) &&
721         (creatorID != CreatorID::phyp))
722     {
723         return;
724     }
725 
726     // Now check if it has any type of callout
727     if (pel->isHwCalloutPresent())
728     {
729         lg2::info(
730             "QuiesceOnHwError enabled, PEL severity not nonError or recovered, "
731             "and callout is present");
732 
733         _logManager.quiesceOnError(pel->obmcLogID());
734     }
735 }
736 
getEventId(const openpower::pels::PEL & pel) const737 std::string Manager::getEventId(const openpower::pels::PEL& pel) const
738 {
739     std::string str;
740     auto src = pel.primarySRC();
741     if (src)
742     {
743         const auto& hexwords = (*src)->hexwordData();
744 
745         std::string refcode = (*src)->asciiString();
746         size_t pos = refcode.find_last_not_of(0x20);
747         if (pos != std::string::npos)
748         {
749             refcode.erase(pos + 1);
750         }
751         str = refcode;
752 
753         for (auto& value : hexwords)
754         {
755             str += " ";
756             str += getNumberString("%08X", value);
757         }
758     }
759     return sanitizeFieldForDBus(str);
760 }
761 
updateEventId(std::unique_ptr<openpower::pels::PEL> & pel)762 void Manager::updateEventId(std::unique_ptr<openpower::pels::PEL>& pel)
763 {
764     std::string eventIdStr = getEventId(*pel);
765 
766     auto entryN = _logManager.entries.find(pel->obmcLogID());
767     if (entryN != _logManager.entries.end())
768     {
769         entryN->second->eventId(eventIdStr, true);
770     }
771 }
772 
sanitizeFieldForDBus(std::string field)773 std::string Manager::sanitizeFieldForDBus(std::string field)
774 {
775     std::for_each(field.begin(), field.end(), [](char& ch) {
776         if (((ch < ' ') || (ch > '~')) && (ch != '\n') && (ch != '\t'))
777         {
778             ch = ' ';
779         }
780     });
781     return field;
782 }
783 
getResolution(const openpower::pels::PEL & pel) const784 std::string Manager::getResolution(const openpower::pels::PEL& pel) const
785 {
786     std::string str;
787     std::string resolution;
788     auto src = pel.primarySRC();
789     if (src)
790     {
791         // First extract the callout pointer and then go through
792         const auto& callouts = (*src)->callouts();
793         namespace pv = openpower::pels::pel_values;
794         // All PELs dont have callout, check before parsing callout data
795         if (callouts)
796         {
797             const auto& entries = callouts->callouts();
798             // Entry starts with index 1
799             uint8_t index = 1;
800             for (auto& entry : entries)
801             {
802                 resolution += std::to_string(index) + ". ";
803                 // Adding Location code to resolution
804                 if (!entry->locationCode().empty())
805                     resolution += "Location Code: " + entry->locationCode() +
806                                   ", ";
807                 if (entry->fruIdentity())
808                 {
809                     // Get priority and set the resolution string
810                     str = pv::getValue(entry->priority(),
811                                        pel_values::calloutPriorityValues,
812                                        pel_values::registryNamePos);
813                     str[0] = toupper(str[0]);
814                     resolution += "Priority: " + str + ", ";
815                     if (entry->fruIdentity()->getPN().has_value())
816                     {
817                         resolution +=
818                             "PN: " + entry->fruIdentity()->getPN().value() +
819                             ", ";
820                     }
821                     if (entry->fruIdentity()->getSN().has_value())
822                     {
823                         resolution +=
824                             "SN: " + entry->fruIdentity()->getSN().value() +
825                             ", ";
826                     }
827                     if (entry->fruIdentity()->getCCIN().has_value())
828                     {
829                         resolution +=
830                             "CCIN: " + entry->fruIdentity()->getCCIN().value() +
831                             ", ";
832                     }
833                     // Add the maintenance procedure
834                     if (entry->fruIdentity()->getMaintProc().has_value())
835                     {
836                         resolution +=
837                             "Procedure: " +
838                             entry->fruIdentity()->getMaintProc().value() + ", ";
839                     }
840                 }
841                 resolution.resize(resolution.size() - 2);
842                 resolution += "\n";
843                 index++;
844             }
845         }
846     }
847     return sanitizeFieldForDBus(resolution);
848 }
849 
updateResolution(const openpower::pels::PEL & pel)850 bool Manager::updateResolution(const openpower::pels::PEL& pel)
851 {
852     std::string callouts = getResolution(pel);
853     auto entryN = _logManager.entries.find(pel.obmcLogID());
854     if (entryN != _logManager.entries.end())
855     {
856         entryN->second->resolution(callouts, true);
857     }
858 
859     return false;
860 }
861 
serializeLogEntry(uint32_t obmcLogID)862 void Manager::serializeLogEntry(uint32_t obmcLogID)
863 {
864     auto entryN = _logManager.entries.find(obmcLogID);
865     if (entryN != _logManager.entries.end())
866     {
867         serialize(*entryN->second);
868     }
869 }
870 
updateDBusSeverity(const openpower::pels::PEL & pel)871 void Manager::updateDBusSeverity(const openpower::pels::PEL& pel)
872 {
873     // The final severity of the PEL may not agree with the
874     // original severity of the D-Bus event log.  Update the
875     // D-Bus property to match in some cases.  This is to
876     // ensure there isn't a Critical or Warning Redfish event
877     // log for an informational or recovered PEL (or vice versa).
878     // This doesn't make an explicit call to serialize the new
879     // event log property value because updateEventId() is called
880     // right after this and will do it.
881     auto sevType =
882         static_cast<SeverityType>(pel.userHeader().severity() & 0xF0);
883 
884     auto entryN = _logManager.entries.find(pel.obmcLogID());
885     if (entryN != _logManager.entries.end())
886     {
887         auto newSeverity =
888             fixupLogSeverity(entryN->second->severity(), sevType);
889         if (newSeverity)
890         {
891             lg2::info("Changing event log {ID} severity from {OLD} "
892                       "to {NEW} to match PEL",
893                       "ID", lg2::hex, entryN->second->id(), "OLD",
894                       Entry::convertLevelToString(entryN->second->severity()),
895                       "NEW", Entry::convertLevelToString(*newSeverity));
896 
897             entryN->second->severity(*newSeverity, true);
898         }
899     }
900 }
901 
setEntryPath(uint32_t obmcLogID)902 void Manager::setEntryPath(uint32_t obmcLogID)
903 {
904     Repository::LogID id{Repository::LogID::Obmc(obmcLogID)};
905     if (auto attributes = _repo.getPELAttributes(id); attributes)
906     {
907         auto& attr = attributes.value().get();
908         auto entry = _logManager.entries.find(obmcLogID);
909         if (entry != _logManager.entries.end())
910         {
911             entry->second->path(attr.path, true);
912         }
913     }
914 }
915 
setServiceProviderNotifyFlag(uint32_t obmcLogID)916 void Manager::setServiceProviderNotifyFlag(uint32_t obmcLogID)
917 {
918     Repository::LogID id{Repository::LogID::Obmc(obmcLogID)};
919     if (auto attributes = _repo.getPELAttributes(id); attributes)
920     {
921         auto& attr = attributes.value().get();
922         auto entry = _logManager.entries.find(obmcLogID);
923         if (entry != _logManager.entries.end())
924         {
925             if (attr.actionFlags.test(callHomeFlagBit))
926             {
927                 entry->second->serviceProviderNotify(Entry::Notify::Notify,
928                                                      true);
929             }
930             else
931             {
932                 entry->second->serviceProviderNotify(Entry::Notify::Inhibit,
933                                                      true);
934             }
935         }
936     }
937 }
938 
createPELEntry(uint32_t obmcLogID,bool skipIaSignal)939 void Manager::createPELEntry(uint32_t obmcLogID, bool skipIaSignal)
940 {
941     std::map<std::string, PropertiesVariant> varData;
942     Repository::LogID id{Repository::LogID::Obmc(obmcLogID)};
943     if (auto attributes = _repo.getPELAttributes(id); attributes)
944     {
945         namespace pv = openpower::pels::pel_values;
946         auto& attr = attributes.value().get();
947 
948         // get the hidden flag values
949         auto sevType = static_cast<SeverityType>(attr.severity & 0xF0);
950         auto isHidden = true;
951         if (((sevType != SeverityType::nonError) &&
952              attr.actionFlags.test(reportFlagBit) &&
953              !attr.actionFlags.test(hiddenFlagBit)) ||
954             ((sevType == SeverityType::nonError) &&
955              attr.actionFlags.test(serviceActionFlagBit)))
956         {
957             isHidden = false;
958         }
959         varData.emplace(std::string("Hidden"), isHidden);
960         varData.emplace(
961             std::string("Subsystem"),
962             pv::getValue(attr.subsystem, pel_values::subsystemValues));
963 
964         varData.emplace(
965             std::string("ManagementSystemAck"),
966             (attr.hmcState == TransmissionState::acked ? true : false));
967 
968         varData.emplace("PlatformLogID", attr.plid);
969         varData.emplace("Deconfig", attr.deconfig);
970         varData.emplace("Guard", attr.guard);
971         varData.emplace("Timestamp", attr.creationTime);
972 
973         // Path to create PELEntry Interface is same as PEL
974         auto path = std::string(OBJ_ENTRY) + '/' + std::to_string(obmcLogID);
975         // Create Interface for PELEntry and set properties
976         auto pelEntry = std::make_unique<PELEntry>(_logManager.getBus(), path,
977                                                    varData, obmcLogID, &_repo);
978         if (!skipIaSignal)
979         {
980             pelEntry->emit_added();
981         }
982         _pelEntries.emplace(std::move(path), std::move(pelEntry));
983     }
984 }
985 
getPELIdFromBMCLogId(uint32_t bmcLogId)986 uint32_t Manager::getPELIdFromBMCLogId(uint32_t bmcLogId)
987 {
988     Repository::LogID id{Repository::LogID::Obmc(bmcLogId)};
989     if (auto logId = _repo.getLogID(id); !logId.has_value())
990     {
991         throw common_error::InvalidArgument();
992     }
993     else
994     {
995         return logId->pelID.id;
996     }
997 }
998 
getBMCLogIdFromPELId(uint32_t pelId)999 uint32_t Manager::getBMCLogIdFromPELId(uint32_t pelId)
1000 {
1001     Repository::LogID id{Repository::LogID::Pel(pelId)};
1002     if (auto logId = _repo.getLogID(id); !logId.has_value())
1003     {
1004         throw common_error::InvalidArgument();
1005     }
1006     else
1007     {
1008         return logId->obmcID.id;
1009     }
1010 }
1011 
updateProgressSRC(std::unique_ptr<openpower::pels::PEL> & pel) const1012 void Manager::updateProgressSRC(
1013     std::unique_ptr<openpower::pels::PEL>& pel) const
1014 {
1015     // Check for pel severity of type - 0x51 = critical error, system
1016     // termination
1017     if (pel->userHeader().severity() == 0x51)
1018     {
1019         auto src = pel->primarySRC();
1020         if (src)
1021         {
1022             std::vector<uint8_t> asciiSRC = (*src)->getSrcStruct();
1023             uint64_t srcRefCode = 0;
1024 
1025             // Read bytes from offset [40-47] e.g. BD8D1001
1026             for (int i = 0; i < 8; i++)
1027             {
1028                 srcRefCode |=
1029                     (static_cast<uint64_t>(asciiSRC[40 + i]) << (8 * i));
1030             }
1031 
1032             try
1033             {
1034                 _dataIface->createProgressSRC(srcRefCode, asciiSRC);
1035             }
1036             catch (const std::exception&)
1037             {
1038                 // Exception - may be no boot progress interface on dbus
1039             }
1040         }
1041     }
1042 }
1043 
scheduleObmcLogDelete(uint32_t obmcLogID)1044 void Manager::scheduleObmcLogDelete(uint32_t obmcLogID)
1045 {
1046     _obmcLogDeleteEventSource = std::make_unique<sdeventplus::source::Defer>(
1047         _event, std::bind(std::mem_fn(&Manager::deleteObmcLog), this,
1048                           std::placeholders::_1, obmcLogID));
1049 }
1050 
deleteObmcLog(sdeventplus::source::EventBase &,uint32_t obmcLogID)1051 void Manager::deleteObmcLog(sdeventplus::source::EventBase&, uint32_t obmcLogID)
1052 {
1053     lg2::info("Removing event log with no PEL: {BMCID}", "BMCID", obmcLogID);
1054     _logManager.erase(obmcLogID);
1055     _obmcLogDeleteEventSource.reset();
1056 }
1057 
clearPowerThermalDeconfigFlag(const std::string & locationCode,openpower::pels::PEL & pel)1058 bool Manager::clearPowerThermalDeconfigFlag(const std::string& locationCode,
1059                                             openpower::pels::PEL& pel)
1060 {
1061     // The requirements state that only power-thermal or
1062     // fan PELs need their deconfig flag cleared.
1063     static const std::vector<uint32_t> compIDs{bmcThermalCompID, bmcFansCompID};
1064 
1065     if (std::find(compIDs.begin(), compIDs.end(),
1066                   pel.privateHeader().header().componentID) == compIDs.end())
1067     {
1068         return false;
1069     }
1070 
1071     auto src = pel.primarySRC();
1072     const auto& callouts = (*src)->callouts();
1073     if (!callouts)
1074     {
1075         return false;
1076     }
1077 
1078     for (const auto& callout : callouts->callouts())
1079     {
1080         // Look for the passed in location code in a callout that
1081         // is either a normal HW callout or a symbolic FRU with
1082         // a trusted location code callout.
1083         if ((callout->locationCode() != locationCode) ||
1084             !callout->fruIdentity())
1085         {
1086             continue;
1087         }
1088 
1089         if ((callout->fruIdentity()->failingComponentType() !=
1090              src::FRUIdentity::hardwareFRU) &&
1091             (callout->fruIdentity()->failingComponentType() !=
1092              src::FRUIdentity::symbolicFRUTrustedLocCode))
1093         {
1094             continue;
1095         }
1096 
1097         lg2::info(
1098             "Clearing deconfig flag in PEL {ID} with SRC {SRC} because {LOC} was replaced",
1099             "ID", lg2::hex, pel.id(), "SRC", (*src)->asciiString().substr(0, 8),
1100             "LOC", locationCode);
1101         (*src)->clearErrorStatusFlag(SRC::ErrorStatusFlags::deconfigured);
1102         return true;
1103     }
1104     return false;
1105 }
1106 
hardwarePresent(const std::string & locationCode)1107 void Manager::hardwarePresent(const std::string& locationCode)
1108 {
1109     Repository::PELUpdateFunc handlePowerThermalHardwarePresent =
1110         [locationCode](openpower::pels::PEL& pel) {
1111             return Manager::clearPowerThermalDeconfigFlag(locationCode, pel);
1112         };
1113 
1114     // If the PEL was created by the BMC and has the deconfig flag set,
1115     // it's a candidate to have the deconfig flag cleared.
1116     for (const auto& [id, attributes] : _repo.getAttributesMap())
1117     {
1118         if ((attributes.creator == static_cast<uint8_t>(CreatorID::openBMC)) &&
1119             attributes.deconfig)
1120         {
1121             auto updated = _repo.updatePEL(attributes.path,
1122                                            handlePowerThermalHardwarePresent);
1123 
1124             if (updated)
1125             {
1126                 // Also update the property on D-Bus
1127                 auto objPath = std::string(OBJ_ENTRY) + '/' +
1128                                std::to_string(id.obmcID.id);
1129                 auto entryN = _pelEntries.find(objPath);
1130                 if (entryN != _pelEntries.end())
1131                 {
1132                     entryN->second->deconfig(false);
1133                 }
1134                 else
1135                 {
1136                     lg2::error(
1137                         "Could not find PEL Entry D-Bus object for {PATH}",
1138                         "PATH", objPath);
1139                 }
1140             }
1141         }
1142     }
1143 }
1144 
1145 } // namespace pels
1146 } // namespace openpower
1147