1 #include <unistd.h>
2 
3 #include <attn/attn_common.hpp>
4 #include <attn/attn_dbus.hpp>
5 #include <attn/attn_logging.hpp>
6 #include <attn/pel/pel_minimal.hpp>
7 #include <attn/ti_handler.hpp>
8 #include <phosphor-logging/log.hpp>
9 
10 namespace attn
11 {
12 
13 /** @brief Journal entry of type INFO using phosphor logging */
14 template <>
15 void trace<INFO>(const char* i_message)
16 {
17     phosphor::logging::log<phosphor::logging::level::INFO>(i_message);
18 }
19 
20 template <>
21 void trace<ERROR>(const char* i_message)
22 {
23     phosphor::logging::log<phosphor::logging::level::ERR>(i_message);
24 }
25 
26 /** @brief Tuple containing information about ffdc files */
27 using FFDCTuple =
28     std::tuple<util::FFDCFormat, uint8_t, uint8_t, sdbusplus::message::unix_fd>;
29 
30 /** @brief Gather messages from the journal */
31 std::vector<std::string> sdjGetMessages(const std::string& field,
32                                         const std::string& fieldValue,
33                                         unsigned int max);
34 
35 /**
36  * Create FFDCTuple objects corresponding to the specified FFDC files.
37  *
38  * The D-Bus method to create an error log requires a vector of tuples to
39  * pass in the FFDC file information.
40  *
41  * @param   files - FFDC files
42  * @return  vector of FFDCTuple objects
43  */
44 std::vector<FFDCTuple>
45     createFFDCTuples(const std::vector<util::FFDCFile>& files)
46 {
47     std::vector<FFDCTuple> ffdcTuples{};
48     util::transformFFDC(files, ffdcTuples);
49 
50     return ffdcTuples;
51 }
52 
53 /**
54  * @brief Create an FFDCFile object containing raw data
55  *
56  * Throws an exception if an error occurs.
57  *
58  * @param   i_buffer - raw data to add to ffdc faw data file
59  * @param   i_size - size of the raw data
60  * @return  FFDCFile object
61  */
62 util::FFDCFile createFFDCRawFile(void* i_buffer, size_t i_size)
63 {
64     util::FFDCFile file{util::FFDCFormat::Custom};
65 
66     // Write buffer to file and then reset file description file offset
67     int fd          = file.getFileDescriptor();
68     size_t numBytes = write(fd, static_cast<char*>(i_buffer), i_size);
69     if (i_size != numBytes)
70     {
71         std::stringstream traceMsg;
72         traceMsg << file.getPath().c_str() << " only " << (int)numBytes
73                  << " of " << (int)i_size << " bytes written";
74         auto strobj = traceMsg.str();
75         trace<level::ERROR>(strobj.c_str());
76     }
77 
78     lseek(fd, 0, SEEK_SET);
79 
80     return file;
81 }
82 
83 /**
84  * @brief Create an FFDCFile object containing the specified lines of text data
85  *
86  * Throws an exception if an error occurs.
87  *
88  * @param   lines - lines of text data to write to file
89  * @return  FFDCFile object
90  */
91 util::FFDCFile createFFDCTraceFile(const std::vector<std::string>& lines)
92 {
93     // Create FFDC file of type Text
94     util::FFDCFile file{util::FFDCFormat::Text};
95     int fd = file.getFileDescriptor();
96 
97     // Write FFDC lines to file
98     std::string buffer;
99     for (const std::string& line : lines)
100     {
101         // Copy line to buffer.  Add newline if necessary.
102         buffer = line;
103         if (line.empty() || (line.back() != '\n'))
104         {
105             buffer += '\n';
106         }
107 
108         // write buffer to file
109         size_t numBytes = write(fd, buffer.c_str(), buffer.size());
110         if (buffer.size() != numBytes)
111         {
112             std::stringstream traceMsg;
113             traceMsg << file.getPath().c_str() << " only " << (int)numBytes
114                      << " of " << (int)buffer.size() << " bytes written";
115             auto strobj = traceMsg.str();
116             trace<level::ERROR>(strobj.c_str());
117         }
118     }
119 
120     // Seek to beginning of file so error logging system can read data
121     lseek(fd, 0, SEEK_SET);
122 
123     return file;
124 }
125 
126 /**
127  * Create FDDC files from journal messages of relevant executables
128  *
129  * Parse the system journal looking for log entries created by the executables
130  * of interest for logging. For each of these entries create a ffdc trace file
131  * that will be used to create ffdc log entries. These files will be pushed
132  * onto the stack of ffdc files.
133  *
134  * @param   i_files - vector of ffdc files that will become log entries
135  */
136 void createFFDCTraceFiles(std::vector<util::FFDCFile>& i_files)
137 {
138     // Executables of interest
139     std::vector<std::string> executables{"openpower-hw-diags"};
140 
141     for (const std::string& executable : executables)
142     {
143         try
144         {
145             // get journal messages
146             std::vector<std::string> messages =
147                 sdjGetMessages("SYSLOG_IDENTIFIER", executable, 30);
148 
149             // Create FFDC file containing the journal messages
150             if (!messages.empty())
151             {
152                 i_files.emplace_back(createFFDCTraceFile(messages));
153             }
154         }
155         catch (const std::exception& e)
156         {
157             trace<level::INFO>("createFFDCTraceFiles exception");
158             std::string traceMsg = std::string(e.what(), maxTraceLen);
159             trace<level::INFO>(traceMsg.c_str());
160         }
161     }
162 }
163 
164 /**
165  * Create FFDCFile objects containing debug data to store in the error log.
166  *
167  * If an error occurs, the error is written to the journal but an exception
168  * is not thrown.
169  *
170  * @param   i_buffer - raw data (if creating raw dump ffdc entry in log)
171  * @return  vector of FFDCFile objects
172  */
173 std::vector<util::FFDCFile> createFFDCFiles(char* i_buffer = nullptr,
174                                             size_t i_size  = 0)
175 {
176     std::vector<util::FFDCFile> files{};
177 
178     // Create raw dump file
179     if ((nullptr != i_buffer) && (0 != i_size))
180     {
181         files.emplace_back(createFFDCRawFile(i_buffer, i_size));
182     }
183 
184     // Create trace dump file
185     createFFDCTraceFiles(files);
186 
187     return files;
188 }
189 
190 /**
191  * Create a PEL from an existing PEL
192  *
193  * Create a new PEL based on the specified raw PEL and submit the new PEL
194  * to the backend logging code as a raw PEL. Note that  additional data map
195  * here contains data to be committed to the PEL and it can also be used to
196  * create the PEL as it contains needed information.
197  *
198  * @param   i_buffer - buffer containing a raw PEL
199  * @param   i_additional - additional data to be added to the new PEL
200  */
201 void createPelCustom(std::vector<uint8_t>& i_rawPel,
202                      std::map<std::string, std::string> i_additional)
203 {
204     // create PEL object from buffer
205     auto tiPel = std::make_unique<pel::PelMinimal>(i_rawPel);
206 
207     // The additional data contains the TI info as well as the value for the
208     // subystem that provided the TI info. Get the subystem from additional
209     // data and then populate the prmary SRC and SRC words for the custom PEL
210     // based on the sybsystem's TI info.
211     uint8_t subsystem = std::stoi(i_additional["Subsystem"]);
212     tiPel->setSubsystem(subsystem);
213 
214     if (static_cast<uint8_t>(pel::SubsystemID::hypervisor) == subsystem)
215     {
216         // populate hypervisor SRC words
217         tiPel->setSrcWords(std::array<uint32_t, pel::numSrcWords>{
218             (uint32_t)std::stoul(i_additional["0x10 SRC Word 12"], 0, 16),
219             (uint32_t)std::stoul(i_additional["0x14 SRC Word 13"], 0, 16),
220             (uint32_t)std::stoul(i_additional["0x18 SRC Word 14"], 0, 16),
221             (uint32_t)std::stoul(i_additional["0x1c SRC Word 15"], 0, 16),
222             (uint32_t)std::stoul(i_additional["0x20 SRC Word 16"], 0, 16),
223             (uint32_t)std::stoul(i_additional["0x24 SRC Word 17"], 0, 16),
224             (uint32_t)std::stoul(i_additional["0x28 SRC Word 18"], 0, 16),
225             (uint32_t)std::stoul(i_additional["0x2c SRC Word 19"], 0, 16)});
226 
227         // Populate phyp primary SRC
228 
229         // char array for raw pel src
230         std::array<char, pel::asciiStringSize> srcChars{'0'};
231 
232         // src from TI info
233         std::string srcString = i_additional["SrcAscii"];
234 
235         // copy from string to char array
236         srcString.copy(srcChars.data(),
237                        std::min(srcString.size(), pel::asciiStringSize), 0);
238 
239         tiPel->setAsciiString(srcChars); // pel object src is char array
240 
241         // set symptom-id
242         auto symptomId = (i_additional["SrcAscii"].substr(0, 8) + '_');
243 
244         symptomId += (i_additional["0x10 SRC Word 12"]);
245         symptomId += (i_additional["0x14 SRC Word 13"] + '_');
246         symptomId += (i_additional["0x18 SRC Word 14"]);
247         symptomId += (i_additional["0x1c SRC Word 15"] + '_');
248         symptomId += (i_additional["0x20 SRC Word 16"]);
249         symptomId += (i_additional["0x24 SRC Word 17"] + '_');
250         symptomId += (i_additional["0x28 SRC Word 18"]);
251         symptomId += (i_additional["0x2c SRC Word 19"]);
252 
253         // setSymptomId will take care of required null-terminate and padding
254         tiPel->setSymptomId(symptomId);
255     }
256     else
257     {
258         // Populate hostboot SRC words - note HB word 0 from the shared info
259         // data (additional data "0x10 HB Word") is reflected in the PEL as
260         // "reason code" so we zero it here. Also note that the first word
261         // in this group of words starts at word 0 and word 1 does not exits.
262         tiPel->setSrcWords(std::array<uint32_t, pel::numSrcWords>{
263             (uint32_t)0x00000000,
264             (uint32_t)std::stoul(i_additional["0x14 HB Word 2"], 0, 16),
265             (uint32_t)std::stoul(i_additional["0x18 HB Word 3"], 0, 16),
266             (uint32_t)std::stoul(i_additional["0x1c HB Word 4"], 0, 16),
267             (uint32_t)std::stoul(i_additional["0x20 HB Word 5"], 0, 16),
268             (uint32_t)std::stoul(i_additional["0x24 HB Word 6"], 0, 16),
269             (uint32_t)std::stoul(i_additional["0x28 HB Word 7"], 0, 16),
270             (uint32_t)std::stoul(i_additional["0x2c HB Word 8"], 0, 16)});
271 
272         // Populate hostboot primary SRC
273 
274         // char array for raw pel src
275         std::array<char, pel::asciiStringSize> srcChars{'0'};
276 
277         // src from TI info
278         std::string srcString = i_additional["SrcAscii"];
279 
280         // copy from string to char array
281         srcString.copy(srcChars.data(),
282                        std::min(srcString.size(), pel::asciiStringSize), 0);
283 
284         tiPel->setAsciiString(srcChars); // pel object src is char array
285 
286         // set symptom-id
287         auto symptomId = (i_additional["SrcAscii"].substr(0, 8) + '_');
288 
289         symptomId += (i_additional["0x10 HB Word 0"]);       // note: word 1
290         symptomId += (i_additional["0x14 HB Word 2"] + '_'); // does not exist
291         symptomId += (i_additional["0x18 HB Word 3"]);
292         symptomId += (i_additional["0x1c HB Word 4"] + '_');
293         symptomId += (i_additional["0x20 HB Word 5"]);
294         symptomId += (i_additional["0x24 HB Word 6"] + '_');
295         symptomId += (i_additional["0x28 HB Word 7"]);
296         symptomId += (i_additional["0x2c HB Word 8"]);
297 
298         // setSymptomId will take care of required null-terminate and padding
299         tiPel->setSymptomId(symptomId);
300     }
301 
302     // set severity, event type and action flags
303     tiPel->setSeverity(static_cast<uint8_t>(pel::Severity::termination));
304     tiPel->setType(static_cast<uint8_t>(pel::EventType::na));
305     tiPel->setAction(static_cast<uint16_t>(pel::ActionFlags::service |
306                                            pel::ActionFlags::report |
307                                            pel::ActionFlags::call));
308 
309     // The raw PEL that we used as the basis for this custom PEL contains the
310     // attention handler trace data and does not needed to be in this PEL so
311     // we remove it here.
312     tiPel->setSectionCount(tiPel->getSectionCount() - 1);
313 
314     // Update the raw PEL with the new custom PEL data
315     tiPel->raw(i_rawPel);
316 
317     // create PEL from raw data
318     createPelRaw(i_rawPel);
319 }
320 
321 /**
322  * Log an event handled by the attention handler
323  *
324  * Basic (non TI) events will generate a standard message-registry based PEL
325  *
326  * TI events will create two PEL's. One PEL will be informational and will
327  * contain trace information relevent to attention handler. The second PEL
328  * will be specific to the TI type (including the primary SRC) and will be
329  * based off of the TI information provided to the attention handler through
330  * shared TI info data area.
331  *
332  * @param  i_event - The event type
333  * @param  i_additional - Additional PEL data
334  * @param  i_ffdc - FFDC PEL data
335  */
336 void event(EventType i_event, std::map<std::string, std::string>& i_additional,
337            const std::vector<util::FFDCFile>& i_ffdc)
338 {
339     bool eventValid = false; // assume no event created
340     bool tiEvent    = false; // assume not a terminate event
341 
342     std::string eventName;
343 
344     switch (i_event)
345     {
346         case EventType::Checkstop:
347             eventName  = "org.open_power.HwDiags.Error.Checkstop";
348             eventValid = true;
349             break;
350         case EventType::Terminate:
351             eventName  = "org.open_power.Attn.Error.Terminate";
352             eventValid = true;
353             tiEvent    = true;
354             break;
355         case EventType::Vital:
356             eventName  = "org.open_power.Attn.Error.Vital";
357             eventValid = true;
358             break;
359         case EventType::HwDiagsFail:
360         case EventType::AttentionFail:
361             eventName  = "org.open_power.Attn.Error.Fail";
362             eventValid = true;
363             break;
364         default:
365             eventValid = false;
366             break;
367     }
368 
369     if (true == eventValid)
370     {
371         // Create PEL with additional data and FFDC data. The newly created
372         // PEL's platform log-id will be returned.
373         auto pelId =
374             createPel(eventName, i_additional, createFFDCTuples(i_ffdc));
375 
376         // If this is a TI event we will create an additional PEL that is
377         // specific to the subsystem that generated the TI.
378         if ((true == tiEvent) && (0 != pelId))
379         {
380             // get file descriptor and size of information PEL
381             int pelFd = getPel(pelId);
382 
383             // if PEL found, read into buffer
384             if (-1 != pelFd)
385             {
386                 auto pelSize = lseek(pelFd, 0, SEEK_END);
387                 lseek(pelFd, 0, SEEK_SET);
388 
389                 // read information PEL into buffer
390                 std::vector<uint8_t> buffer(pelSize);
391                 size_t numBytes = read(pelFd, buffer.data(), buffer.size());
392                 if (buffer.size() != numBytes)
393                 {
394                     std::stringstream traceMsg;
395                     traceMsg << "Error reading event log: " << (int)numBytes
396                              << " of " << (int)buffer.size() << " bytes read";
397                     auto strobj = traceMsg.str();
398                     trace<level::ERROR>(strobj.c_str());
399                 }
400                 else
401                 {
402                     // create PEL from buffer
403                     createPelCustom(buffer, i_additional);
404                 }
405 
406                 close(pelFd);
407             }
408 
409             uint8_t subsystem = std::stoi(i_additional["Subsystem"]);
410 
411             // If not hypervisor TI
412             if (static_cast<uint8_t>(pel::SubsystemID::hypervisor) != subsystem)
413             {
414                 // Request a dump and transition the host
415                 if ("true" == i_additional["Dump"])
416                 {
417                     // will not return until dump is complete
418                     requestDump(pelId);
419                 }
420             }
421         }
422     }
423 }
424 
425 /**
426  * Commit special attention TI event to log
427  *
428  * Create a event log with provided additional information and standard
429  * FFDC data plus TI FFDC data
430  *
431  * @param i_additional - Additional log data
432  * @param i_ti_InfoData - TI FFDC data
433  */
434 void eventTerminate(std::map<std::string, std::string> i_additionalData,
435                     char* i_tiInfoData)
436 {
437 
438     uint32_t tiInfoSize = 0; // assume TI info was not available
439 
440     if (nullptr != i_tiInfoData)
441     {
442         tiInfoSize = 56; // assume not hypervisor TI
443 
444         uint8_t subsystem = std::stoi(i_additionalData["Subsystem"]);
445 
446         // If hypervisor
447         if (static_cast<uint8_t>(pel::SubsystemID::hypervisor) == subsystem)
448         {
449             tiInfoSize = 1024; // assume hypervisor max
450 
451             // hypervisor may just want some of the data
452             if (0 == (*(i_tiInfoData + 0x09) & 0x01))
453             {
454                 uint32_t* additionalLength = (uint32_t*)(i_tiInfoData + 0x50);
455                 uint32_t tiAdditional      = be32toh(*additionalLength);
456                 tiInfoSize = std::min(tiInfoSize, (84 + tiAdditional));
457             }
458         }
459     }
460 
461     std::string traceMsg = "TI info size = " + std::to_string(tiInfoSize);
462     trace<level::INFO>(traceMsg.c_str());
463 
464     event(EventType::Terminate, i_additionalData,
465           createFFDCFiles(i_tiInfoData, tiInfoSize));
466 }
467 
468 /** @brief Commit SBE vital event to log */
469 void eventVital()
470 {
471     // Additional data for log
472     std::map<std::string, std::string> additionalData;
473 
474     // Create log event with additional data and FFDC data
475     event(EventType::Vital, additionalData, createFFDCFiles(nullptr, 0));
476 }
477 
478 /**
479  * Commit attention handler failure event to log
480  *
481  * Create an event log containing the specified error code.
482  *
483  * @param i_error - Error code
484  */
485 void eventAttentionFail(int i_error)
486 {
487     // Additional data for log
488     std::map<std::string, std::string> additionalData;
489     additionalData["ERROR_CODE"] = std::to_string(i_error);
490 
491     // Create log event with additional data and FFDC data
492     event(EventType::AttentionFail, additionalData,
493           createFFDCFiles(nullptr, 0));
494 }
495 
496 /**
497  * Parse systemd journal message field
498  *
499  * Parse the journal looking for the specified field and return the journal
500  * data for that field.
501  *
502  * @param  journal - The journal to parse
503  * @param  field - Field containing the data to retrieve
504  * @return Data for the speciefied field
505  */
506 std::string sdjGetFieldValue(sd_journal* journal, const char* field)
507 {
508     const char* data{nullptr};
509     size_t length{0};
510 
511     // get field value
512     if (0 == sd_journal_get_data(journal, field, (const void**)&data, &length))
513     {
514         size_t prefix{0};
515 
516         // The data returned  by sd_journal_get_data will be prefixed with the
517         // field name and "="
518         const void* eq = memchr(data, '=', length);
519         if (nullptr != eq)
520         {
521             // get just data following the "="
522             prefix = (const char*)eq - data + 1;
523         }
524         else
525         {
526             // all the data (should not happen)
527             prefix = 0;
528             std::string value{}; // empty string
529         }
530 
531         return std::string{data + prefix, length - prefix};
532     }
533     else
534     {
535         return std::string{}; // empty string
536     }
537 }
538 
539 /**
540  * Gather messages from the journal
541  *
542  * Fetch journal entry data for all entries with the specified field equal to
543  * the specified value.
544  *
545  * @param   field - Field to search on
546  * @param   fieldValue -  Value to search for
547  * @param   max - Maximum number of messages fetch
548  * @return  Vector of journal entry data
549  */
550 std::vector<std::string> sdjGetMessages(const std::string& field,
551                                         const std::string& fieldValue,
552                                         unsigned int max)
553 {
554     sd_journal* journal;
555     std::vector<std::string> messages;
556 
557     if (0 == sd_journal_open(&journal, SD_JOURNAL_LOCAL_ONLY))
558     {
559         SD_JOURNAL_FOREACH_BACKWARDS(journal)
560         {
561             // Get input field
562             std::string value = sdjGetFieldValue(journal, field.c_str());
563 
564             // Compare field value and read data
565             if (value == fieldValue)
566             {
567                 // Get SYSLOG_IDENTIFIER field (process that logged message)
568                 std::string syslog =
569                     sdjGetFieldValue(journal, "SYSLOG_IDENTIFIER");
570 
571                 // Get _PID field
572                 std::string pid = sdjGetFieldValue(journal, "_PID");
573 
574                 // Get MESSAGE field
575                 std::string message = sdjGetFieldValue(journal, "MESSAGE");
576 
577                 // Get timestamp
578                 uint64_t usec{0};
579                 if (0 == sd_journal_get_realtime_usec(journal, &usec))
580                 {
581 
582                     // Convert realtime microseconds to date format
583                     char dateBuffer[80];
584                     std::string date;
585                     std::time_t timeInSecs = usec / 1000000;
586                     strftime(dateBuffer, sizeof(dateBuffer), "%b %d %H:%M:%S",
587                              std::localtime(&timeInSecs));
588                     date = dateBuffer;
589 
590                     // Store value to messages
591                     value = date + " " + syslog + "[" + pid + "]: " + message;
592                     messages.insert(messages.begin(), value);
593                 }
594             }
595 
596             // limit maximum number of messages
597             if (messages.size() >= max)
598             {
599                 break;
600             }
601         }
602 
603         sd_journal_close(journal); // close journal when done
604     }
605 
606     return messages;
607 }
608 
609 } // namespace attn
610