1 #include <unistd.h>
2 
3 #include <attn/attn_common.hpp>
4 #include <attn/attn_dbus.hpp>
5 #include <attn/attn_dump.hpp>
6 #include <attn/attn_logging.hpp>
7 #include <attn/pel/pel_minimal.hpp>
8 #include <phosphor-logging/log.hpp>
9 
10 namespace attn
11 {
12 
13 /** @brief Journal entry of type INFO using phosphor logging */
14 template <>
15 void trace<INFO>(const char* i_message)
16 {
17     phosphor::logging::log<phosphor::logging::level::INFO>(i_message);
18 }
19 
20 template <>
21 void trace<ERROR>(const char* i_message)
22 {
23     phosphor::logging::log<phosphor::logging::level::ERR>(i_message);
24 }
25 
26 /** @brief Tuple containing information about ffdc files */
27 using FFDCTuple =
28     std::tuple<util::FFDCFormat, uint8_t, uint8_t, sdbusplus::message::unix_fd>;
29 
30 /** @brief Gather messages from the journal */
31 std::vector<std::string> sdjGetMessages(const std::string& field,
32                                         const std::string& fieldValue,
33                                         unsigned int max);
34 
35 /**
36  * Create FFDCTuple objects corresponding to the specified FFDC files.
37  *
38  * The D-Bus method to create an error log requires a vector of tuples to
39  * pass in the FFDC file information.
40  *
41  * @param   files - FFDC files
42  * @return  vector of FFDCTuple objects
43  */
44 std::vector<FFDCTuple>
45     createFFDCTuples(const std::vector<util::FFDCFile>& files)
46 {
47     std::vector<FFDCTuple> ffdcTuples{};
48     util::transformFFDC(files, ffdcTuples);
49 
50     return ffdcTuples;
51 }
52 
53 /**
54  * @brief Create an FFDCFile object containing raw data
55  *
56  * Throws an exception if an error occurs.
57  *
58  * @param   i_buffer - raw data to add to ffdc faw data file
59  * @param   i_size - size of the raw data
60  * @return  FFDCFile object
61  */
62 util::FFDCFile createFFDCRawFile(void* i_buffer, size_t i_size)
63 {
64     util::FFDCFile file{util::FFDCFormat::Custom};
65 
66     // Write buffer to file and then reset file description file offset
67     int fd          = file.getFileDescriptor();
68     size_t numBytes = write(fd, static_cast<char*>(i_buffer), i_size);
69     if (i_size != numBytes)
70     {
71         std::stringstream traceMsg;
72         traceMsg << file.getPath().c_str() << " only " << (int)numBytes
73                  << " of " << (int)i_size << " bytes written";
74         auto strobj = traceMsg.str();
75         trace<level::ERROR>(strobj.c_str());
76     }
77 
78     lseek(fd, 0, SEEK_SET);
79 
80     return file;
81 }
82 
83 /**
84  * @brief Create an FFDCFile object containing the specified lines of text data
85  *
86  * Throws an exception if an error occurs.
87  *
88  * @param   lines - lines of text data to write to file
89  * @return  FFDCFile object
90  */
91 util::FFDCFile createFFDCTraceFile(const std::vector<std::string>& lines)
92 {
93     // Create FFDC file of type Text
94     util::FFDCFile file{util::FFDCFormat::Text};
95     int fd = file.getFileDescriptor();
96 
97     // Write FFDC lines to file
98     std::string buffer;
99     for (const std::string& line : lines)
100     {
101         // Copy line to buffer.  Add newline if necessary.
102         buffer = line;
103         if (line.empty() || (line.back() != '\n'))
104         {
105             buffer += '\n';
106         }
107 
108         // write buffer to file
109         size_t numBytes = write(fd, buffer.c_str(), buffer.size());
110         if (buffer.size() != numBytes)
111         {
112             std::stringstream traceMsg;
113             traceMsg << file.getPath().c_str() << " only " << (int)numBytes
114                      << " of " << (int)buffer.size() << " bytes written";
115             auto strobj = traceMsg.str();
116             trace<level::ERROR>(strobj.c_str());
117         }
118     }
119 
120     // Seek to beginning of file so error logging system can read data
121     lseek(fd, 0, SEEK_SET);
122 
123     return file;
124 }
125 
126 /**
127  * Create FDDC files from journal messages of relevant executables
128  *
129  * Parse the system journal looking for log entries created by the executables
130  * of interest for logging. For each of these entries create a ffdc trace file
131  * that will be used to create ffdc log entries. These files will be pushed
132  * onto the stack of ffdc files.
133  *
134  * @param   i_files - vector of ffdc files that will become log entries
135  */
136 void createFFDCTraceFiles(std::vector<util::FFDCFile>& i_files)
137 {
138     // Executables of interest
139     std::vector<std::string> executables{"openpower-hw-diags"};
140 
141     for (const std::string& executable : executables)
142     {
143         try
144         {
145             // get journal messages
146             std::vector<std::string> messages =
147                 sdjGetMessages("SYSLOG_IDENTIFIER", executable, 30);
148 
149             // Create FFDC file containing the journal messages
150             if (!messages.empty())
151             {
152                 i_files.emplace_back(createFFDCTraceFile(messages));
153             }
154         }
155         catch (const std::exception& e)
156         {
157             trace<level::INFO>("createFFDCTraceFiles exception");
158             std::string traceMsg = std::string(e.what(), maxTraceLen);
159             trace<level::INFO>(traceMsg.c_str());
160         }
161     }
162 }
163 
164 /**
165  * Create FFDCFile objects containing debug data to store in the error log.
166  *
167  * If an error occurs, the error is written to the journal but an exception
168  * is not thrown.
169  *
170  * @param   i_buffer - raw data (if creating raw dump ffdc entry in log)
171  * @return  vector of FFDCFile objects
172  */
173 std::vector<util::FFDCFile> createFFDCFiles(char* i_buffer = nullptr,
174                                             size_t i_size  = 0)
175 {
176     std::vector<util::FFDCFile> files{};
177 
178     // Create raw dump file
179     if ((nullptr != i_buffer) && (0 != i_size))
180     {
181         files.emplace_back(createFFDCRawFile(i_buffer, i_size));
182     }
183 
184     // Create trace dump file
185     createFFDCTraceFiles(files);
186 
187     return files;
188 }
189 
190 /**
191  * Create a PEL from an existing PEL
192  *
193  * Create a new PEL based on the specified raw PEL and submit the new PEL
194  * to the backend logging code as a raw PEL. Note that  additional data map
195  * here contains data to be committed to the PEL and it can also be used to
196  * create the PEL as it contains needed information.
197  *
198  * @param   i_buffer - buffer containing a raw PEL
199  * @param   i_additional - additional data to be added to the new PEL
200  */
201 void createPelCustom(std::vector<uint8_t>& i_rawPel,
202                      std::map<std::string, std::string> i_additional)
203 {
204     // create PEL object from buffer
205     auto tiPel = std::make_unique<pel::PelMinimal>(i_rawPel);
206 
207     // The additional data contains the TI info as well as the value for the
208     // subystem that provided the TI info. Get the subystem from additional
209     // data and then populate the prmary SRC and SRC words for the custom PEL
210     // based on the sybsystem's TI info.
211     uint8_t subsystem = std::stoi(i_additional["Subsystem"]);
212     tiPel->setSubsystem(subsystem);
213 
214     if (static_cast<uint8_t>(pel::SubsystemID::hypervisor) == subsystem)
215     {
216         // populate hypervisor SRC words
217         tiPel->setSrcWords(std::array<uint32_t, pel::numSrcWords>{
218             (uint32_t)std::stoul(i_additional["0x10 SRC Word 12"], 0, 16),
219             (uint32_t)std::stoul(i_additional["0x14 SRC Word 13"], 0, 16),
220             (uint32_t)std::stoul(i_additional["0x18 SRC Word 14"], 0, 16),
221             (uint32_t)std::stoul(i_additional["0x1c SRC Word 15"], 0, 16),
222             (uint32_t)std::stoul(i_additional["0x20 SRC Word 16"], 0, 16),
223             (uint32_t)std::stoul(i_additional["0x24 SRC Word 17"], 0, 16),
224             (uint32_t)std::stoul(i_additional["0x28 SRC Word 18"], 0, 16),
225             (uint32_t)std::stoul(i_additional["0x2c SRC Word 19"], 0, 16)});
226 
227         // Populate phyp primary SRC
228 
229         // char array for raw pel src
230         std::array<char, pel::asciiStringSize> srcChars{'0'};
231 
232         // src from TI info
233         std::string srcString = i_additional["SrcAscii"];
234 
235         // copy from string to char array
236         srcString.copy(srcChars.data(),
237                        std::min(srcString.size(), pel::asciiStringSize), 0);
238 
239         tiPel->setAsciiString(srcChars); // pel object src is char array
240 
241         // set symptom-id
242         auto symptomId = (i_additional["SrcAscii"].substr(0, 8) + '_');
243 
244         symptomId += (i_additional["0x10 SRC Word 12"]);
245         symptomId += (i_additional["0x14 SRC Word 13"] + '_');
246         symptomId += (i_additional["0x18 SRC Word 14"]);
247         symptomId += (i_additional["0x1c SRC Word 15"] + '_');
248         symptomId += (i_additional["0x20 SRC Word 16"]);
249         symptomId += (i_additional["0x24 SRC Word 17"] + '_');
250         symptomId += (i_additional["0x28 SRC Word 18"]);
251         symptomId += (i_additional["0x2c SRC Word 19"]);
252 
253         // setSymptomId will take care of required null-terminate and padding
254         tiPel->setSymptomId(symptomId);
255     }
256     else
257     {
258         // Populate hostboot SRC words - note HB word 0 from the shared info
259         // data (additional data "0x10 HB Word") is reflected in the PEL as
260         // "reason code" so we zero it here. Also note that the first word
261         // in this group of words starts at word 0 and word 1 does not exits.
262         tiPel->setSrcWords(std::array<uint32_t, pel::numSrcWords>{
263             (uint32_t)0x00000000,
264             (uint32_t)std::stoul(i_additional["0x14 HB Word 2"], 0, 16),
265             (uint32_t)std::stoul(i_additional["0x18 HB Word 3"], 0, 16),
266             (uint32_t)std::stoul(i_additional["0x1c HB Word 4"], 0, 16),
267             (uint32_t)std::stoul(i_additional["0x20 HB Word 5"], 0, 16),
268             (uint32_t)std::stoul(i_additional["0x24 HB Word 6"], 0, 16),
269             (uint32_t)std::stoul(i_additional["0x28 HB Word 7"], 0, 16),
270             (uint32_t)std::stoul(i_additional["0x2c HB Word 8"], 0, 16)});
271 
272         // Populate hostboot primary SRC
273 
274         // char array for raw pel src
275         std::array<char, pel::asciiStringSize> srcChars{'0'};
276 
277         // src from TI info
278         std::string srcString = i_additional["SrcAscii"];
279 
280         // copy from string to char array
281         srcString.copy(srcChars.data(),
282                        std::min(srcString.size(), pel::asciiStringSize), 0);
283 
284         tiPel->setAsciiString(srcChars); // pel object src is char array
285 
286         // set symptom-id
287         auto symptomId = (i_additional["SrcAscii"].substr(0, 8) + '_');
288 
289         symptomId += (i_additional["0x10 HB Word 0"]);       // note: word 1
290         symptomId += (i_additional["0x14 HB Word 2"] + '_'); // does not exist
291         symptomId += (i_additional["0x18 HB Word 3"]);
292         symptomId += (i_additional["0x1c HB Word 4"] + '_');
293         symptomId += (i_additional["0x20 HB Word 5"]);
294         symptomId += (i_additional["0x24 HB Word 6"] + '_');
295         symptomId += (i_additional["0x28 HB Word 7"]);
296         symptomId += (i_additional["0x2c HB Word 8"]);
297 
298         // setSymptomId will take care of required null-terminate and padding
299         tiPel->setSymptomId(symptomId);
300     }
301 
302     // set severity, event type and action flags
303     tiPel->setSeverity(static_cast<uint8_t>(pel::Severity::termination));
304     tiPel->setType(static_cast<uint8_t>(pel::EventType::na));
305     tiPel->setAction(static_cast<uint16_t>(pel::ActionFlags::service |
306                                            pel::ActionFlags::report |
307                                            pel::ActionFlags::call));
308 
309     // The raw PEL that we used as the basis for this custom PEL contains the
310     // attention handler trace data and does not needed to be in this PEL so
311     // we remove it here.
312     tiPel->setSectionCount(tiPel->getSectionCount() - 1);
313 
314     // Update the raw PEL with the new custom PEL data
315     tiPel->raw(i_rawPel);
316 
317     // create PEL from raw data
318     createPelRaw(i_rawPel);
319 }
320 
321 /**
322  * Log an event handled by the attention handler
323  *
324  * Basic (non TI) events will generate a standard message-registry based PEL
325  *
326  * TI events will create two PEL's. One PEL will be informational and will
327  * contain trace information relevent to attention handler. The second PEL
328  * will be specific to the TI type (including the primary SRC) and will be
329  * based off of the TI information provided to the attention handler through
330  * shared TI info data area.
331  *
332  * @param  i_event - The event type
333  * @param  i_additional - Additional PEL data
334  * @param  i_ffdc - FFDC PEL data
335  * @return Event log Id (0 if no event log generated)
336  */
337 uint32_t event(EventType i_event,
338                std::map<std::string, std::string>& i_additional,
339                const std::vector<util::FFDCFile>& i_ffdc)
340 {
341     uint32_t pelId = 0; // assume no event log generated
342 
343     bool eventValid = false; // assume no event created
344     bool tiEvent    = false; // assume not a terminate event
345 
346     std::string eventName;
347 
348     switch (i_event)
349     {
350         case EventType::Checkstop:
351             eventName  = "org.open_power.HwDiags.Error.Checkstop";
352             eventValid = true;
353             break;
354         case EventType::Terminate:
355             eventName  = "org.open_power.Attn.Error.Terminate";
356             eventValid = true;
357             tiEvent    = true;
358             break;
359         case EventType::Vital:
360             eventName  = "org.open_power.Attn.Error.Vital";
361             eventValid = true;
362             break;
363         case EventType::HwDiagsFail:
364         case EventType::AttentionFail:
365             eventName  = "org.open_power.Attn.Error.Fail";
366             eventValid = true;
367             break;
368         case EventType::PhalSbeChipop:
369             eventName  = "org.open_power.Processor.Error.SbeChipOpFailure";
370             eventValid = true;
371             break;
372         default:
373             eventValid = false;
374             break;
375     }
376 
377     if (true == eventValid)
378     {
379         // Create PEL with additional data and FFDC data. The newly created
380         // PEL's platform log-id will be returned.
381         pelId = createPel(eventName, i_additional, createFFDCTuples(i_ffdc));
382 
383         // If this is a TI event we will create an additional PEL that is
384         // specific to the subsystem that generated the TI.
385         if ((true == tiEvent) && (0 != pelId))
386         {
387             // get file descriptor and size of information PEL
388             int pelFd = getPel(pelId);
389 
390             // if PEL found, read into buffer
391             if (-1 != pelFd)
392             {
393                 auto pelSize = lseek(pelFd, 0, SEEK_END);
394                 lseek(pelFd, 0, SEEK_SET);
395 
396                 // read information PEL into buffer
397                 std::vector<uint8_t> buffer(pelSize);
398                 size_t numBytes = read(pelFd, buffer.data(), buffer.size());
399                 if (buffer.size() != numBytes)
400                 {
401                     std::stringstream traceMsg;
402                     traceMsg << "Error reading event log: " << (int)numBytes
403                              << " of " << (int)buffer.size() << " bytes read";
404                     auto strobj = traceMsg.str();
405                     trace<level::ERROR>(strobj.c_str());
406                 }
407                 else
408                 {
409                     // create PEL from buffer
410                     createPelCustom(buffer, i_additional);
411                 }
412 
413                 close(pelFd);
414             }
415 
416             uint8_t subsystem = std::stoi(i_additional["Subsystem"]);
417 
418             // If not hypervisor TI
419             if (static_cast<uint8_t>(pel::SubsystemID::hypervisor) != subsystem)
420             {
421                 // Request a dump and transition the host
422                 if ("true" == i_additional["Dump"])
423                 {
424                     // will not return until dump is complete
425                     requestDump(DumpParameters{pelId, 0, DumpType::Hostboot});
426                 }
427             }
428         }
429     }
430     return pelId;
431 }
432 
433 /**
434  * Commit special attention TI event to log
435  *
436  * Create a event log with provided additional information and standard
437  * FFDC data plus TI FFDC data
438  *
439  * @param i_additional - Additional log data
440  * @param i_ti_InfoData - TI FFDC data
441  */
442 void eventTerminate(std::map<std::string, std::string> i_additionalData,
443                     char* i_tiInfoData)
444 {
445 
446     uint32_t tiInfoSize = 0; // assume TI info was not available
447 
448     if (nullptr != i_tiInfoData)
449     {
450         tiInfoSize = 56; // assume not hypervisor TI
451 
452         uint8_t subsystem = std::stoi(i_additionalData["Subsystem"]);
453 
454         // If hypervisor
455         if (static_cast<uint8_t>(pel::SubsystemID::hypervisor) == subsystem)
456         {
457             tiInfoSize = 1024; // assume hypervisor max
458 
459             // hypervisor may just want some of the data
460             if (0 == (*(i_tiInfoData + 0x09) & 0x01))
461             {
462                 uint32_t* additionalLength = (uint32_t*)(i_tiInfoData + 0x50);
463                 uint32_t tiAdditional      = be32toh(*additionalLength);
464                 tiInfoSize = std::min(tiInfoSize, (84 + tiAdditional));
465             }
466         }
467     }
468 
469     std::string traceMsg = "TI info size = " + std::to_string(tiInfoSize);
470     trace<level::INFO>(traceMsg.c_str());
471 
472     event(EventType::Terminate, i_additionalData,
473           createFFDCFiles(i_tiInfoData, tiInfoSize));
474 }
475 
476 /** @brief Commit SBE vital event to log, returns event log ID */
477 uint32_t eventVital()
478 {
479     // Additional data for log
480     std::map<std::string, std::string> additionalData;
481 
482     // Create log event with additional data and FFDC data
483     return event(EventType::Vital, additionalData, createFFDCFiles(nullptr, 0));
484 }
485 
486 /**
487  * Commit attention handler failure event to log
488  *
489  * Create an event log containing the specified error code.
490  *
491  * @param i_error - Error code
492  */
493 void eventAttentionFail(int i_error)
494 {
495     // Additional data for log
496     std::map<std::string, std::string> additionalData;
497     additionalData["ERROR_CODE"] = std::to_string(i_error);
498 
499     // Create log event with additional data and FFDC data
500     event(EventType::AttentionFail, additionalData,
501           createFFDCFiles(nullptr, 0));
502 }
503 
504 /**
505  * Commit SBE timeout event to log
506  *
507  * Create an event log indicating an SBE operation timed out.
508  *
509  * @param proc - processor that encountered the error
510  */
511 void eventPhalSbeChipop(uint32_t proc)
512 {
513     trace<level::ERROR>("SBE error while getting TI info");
514 
515     // report proc number in event log entry
516     std::map<std::string, std::string> additionalData;
517     additionalData.emplace("SRC6", std::to_string(proc << 16));
518 
519     // create event with additional data and no ffdc
520     event(EventType::PhalSbeChipop, additionalData,
521           createFFDCFiles(nullptr, 0));
522 }
523 
524 /**
525  * Parse systemd journal message field
526  *
527  * Parse the journal looking for the specified field and return the journal
528  * data for that field.
529  *
530  * @param  journal - The journal to parse
531  * @param  field - Field containing the data to retrieve
532  * @return Data for the speciefied field
533  */
534 std::string sdjGetFieldValue(sd_journal* journal, const char* field)
535 {
536     const char* data{nullptr};
537     size_t length{0};
538 
539     // get field value
540     if (0 == sd_journal_get_data(journal, field, (const void**)&data, &length))
541     {
542         size_t prefix{0};
543 
544         // The data returned  by sd_journal_get_data will be prefixed with the
545         // field name and "="
546         const void* eq = memchr(data, '=', length);
547         if (nullptr != eq)
548         {
549             // get just data following the "="
550             prefix = (const char*)eq - data + 1;
551         }
552         else
553         {
554             // all the data (should not happen)
555             prefix = 0;
556             std::string value{}; // empty string
557         }
558 
559         return std::string{data + prefix, length - prefix};
560     }
561     else
562     {
563         return std::string{}; // empty string
564     }
565 }
566 
567 /**
568  * Gather messages from the journal
569  *
570  * Fetch journal entry data for all entries with the specified field equal to
571  * the specified value.
572  *
573  * @param   field - Field to search on
574  * @param   fieldValue -  Value to search for
575  * @param   max - Maximum number of messages fetch
576  * @return  Vector of journal entry data
577  */
578 std::vector<std::string> sdjGetMessages(const std::string& field,
579                                         const std::string& fieldValue,
580                                         unsigned int max)
581 {
582     sd_journal* journal;
583     std::vector<std::string> messages;
584 
585     if (0 == sd_journal_open(&journal, SD_JOURNAL_LOCAL_ONLY))
586     {
587         SD_JOURNAL_FOREACH_BACKWARDS(journal)
588         {
589             // Get input field
590             std::string value = sdjGetFieldValue(journal, field.c_str());
591 
592             // Compare field value and read data
593             if (value == fieldValue)
594             {
595                 // Get SYSLOG_IDENTIFIER field (process that logged message)
596                 std::string syslog =
597                     sdjGetFieldValue(journal, "SYSLOG_IDENTIFIER");
598 
599                 // Get _PID field
600                 std::string pid = sdjGetFieldValue(journal, "_PID");
601 
602                 // Get MESSAGE field
603                 std::string message = sdjGetFieldValue(journal, "MESSAGE");
604 
605                 // Get timestamp
606                 uint64_t usec{0};
607                 if (0 == sd_journal_get_realtime_usec(journal, &usec))
608                 {
609 
610                     // Convert realtime microseconds to date format
611                     char dateBuffer[80];
612                     std::string date;
613                     std::time_t timeInSecs = usec / 1000000;
614                     strftime(dateBuffer, sizeof(dateBuffer), "%b %d %H:%M:%S",
615                              std::localtime(&timeInSecs));
616                     date = dateBuffer;
617 
618                     // Store value to messages
619                     value = date + " " + syslog + "[" + pid + "]: " + message;
620                     messages.insert(messages.begin(), value);
621                 }
622             }
623 
624             // limit maximum number of messages
625             if (messages.size() >= max)
626             {
627                 break;
628             }
629         }
630 
631         sd_journal_close(journal); // close journal when done
632     }
633 
634     return messages;
635 }
636 
637 } // namespace attn
638