1 #include <unistd.h> 2 3 #include <attn/attn_common.hpp> 4 #include <attn/attn_dbus.hpp> 5 #include <attn/attn_logging.hpp> 6 #include <attn/pel/pel_minimal.hpp> 7 #include <attn/ti_handler.hpp> 8 #include <phosphor-logging/log.hpp> 9 10 namespace attn 11 { 12 13 /** @brief Journal entry of type INFO using phosphor logging */ 14 template <> 15 void trace<INFO>(const char* i_message) 16 { 17 phosphor::logging::log<phosphor::logging::level::INFO>(i_message); 18 } 19 20 template <> 21 void trace<ERROR>(const char* i_message) 22 { 23 phosphor::logging::log<phosphor::logging::level::ERR>(i_message); 24 } 25 26 /** @brief Tuple containing information about ffdc files */ 27 using FFDCTuple = 28 std::tuple<util::FFDCFormat, uint8_t, uint8_t, sdbusplus::message::unix_fd>; 29 30 /** @brief Gather messages from the journal */ 31 std::vector<std::string> sdjGetMessages(const std::string& field, 32 const std::string& fieldValue, 33 unsigned int max); 34 35 /** 36 * Create FFDCTuple objects corresponding to the specified FFDC files. 37 * 38 * The D-Bus method to create an error log requires a vector of tuples to 39 * pass in the FFDC file information. 40 * 41 * @param files - FFDC files 42 * @return vector of FFDCTuple objects 43 */ 44 std::vector<FFDCTuple> 45 createFFDCTuples(const std::vector<util::FFDCFile>& files) 46 { 47 std::vector<FFDCTuple> ffdcTuples{}; 48 util::transformFFDC(files, ffdcTuples); 49 50 return ffdcTuples; 51 } 52 53 /** 54 * @brief Create an FFDCFile object containing raw data 55 * 56 * Throws an exception if an error occurs. 57 * 58 * @param i_buffer - raw data to add to ffdc faw data file 59 * @param i_size - size of the raw data 60 * @return FFDCFile object 61 */ 62 util::FFDCFile createFFDCRawFile(void* i_buffer, size_t i_size) 63 { 64 util::FFDCFile file{util::FFDCFormat::Custom}; 65 66 // Write buffer to file and then reset file description file offset 67 int fd = file.getFileDescriptor(); 68 size_t numBytes = write(fd, static_cast<char*>(i_buffer), i_size); 69 if (i_size != numBytes) 70 { 71 std::stringstream traceMsg; 72 traceMsg << file.getPath().c_str() << " only " << (int)numBytes 73 << " of " << (int)i_size << " bytes written"; 74 auto strobj = traceMsg.str(); 75 trace<level::ERROR>(strobj.c_str()); 76 } 77 78 lseek(fd, 0, SEEK_SET); 79 80 return file; 81 } 82 83 /** 84 * @brief Create an FFDCFile object containing the specified lines of text data 85 * 86 * Throws an exception if an error occurs. 87 * 88 * @param lines - lines of text data to write to file 89 * @return FFDCFile object 90 */ 91 util::FFDCFile createFFDCTraceFile(const std::vector<std::string>& lines) 92 { 93 // Create FFDC file of type Text 94 util::FFDCFile file{util::FFDCFormat::Text}; 95 int fd = file.getFileDescriptor(); 96 97 // Write FFDC lines to file 98 std::string buffer; 99 for (const std::string& line : lines) 100 { 101 // Copy line to buffer. Add newline if necessary. 102 buffer = line; 103 if (line.empty() || (line.back() != '\n')) 104 { 105 buffer += '\n'; 106 } 107 108 // write buffer to file 109 size_t numBytes = write(fd, buffer.c_str(), buffer.size()); 110 if (buffer.size() != numBytes) 111 { 112 std::stringstream traceMsg; 113 traceMsg << file.getPath().c_str() << " only " << (int)numBytes 114 << " of " << (int)buffer.size() << " bytes written"; 115 auto strobj = traceMsg.str(); 116 trace<level::ERROR>(strobj.c_str()); 117 } 118 } 119 120 // Seek to beginning of file so error logging system can read data 121 lseek(fd, 0, SEEK_SET); 122 123 return file; 124 } 125 126 /** 127 * Create FDDC files from journal messages of relevant executables 128 * 129 * Parse the system journal looking for log entries created by the executables 130 * of interest for logging. For each of these entries create a ffdc trace file 131 * that will be used to create ffdc log entries. These files will be pushed 132 * onto the stack of ffdc files. 133 * 134 * @param i_files - vector of ffdc files that will become log entries 135 */ 136 void createFFDCTraceFiles(std::vector<util::FFDCFile>& i_files) 137 { 138 // Executables of interest 139 std::vector<std::string> executables{"openpower-hw-diags"}; 140 141 for (const std::string& executable : executables) 142 { 143 try 144 { 145 // get journal messages 146 std::vector<std::string> messages = 147 sdjGetMessages("SYSLOG_IDENTIFIER", executable, 30); 148 149 // Create FFDC file containing the journal messages 150 if (!messages.empty()) 151 { 152 i_files.emplace_back(createFFDCTraceFile(messages)); 153 } 154 } 155 catch (const std::exception& e) 156 { 157 trace<level::INFO>("createFFDCTraceFiles exception"); 158 std::string traceMsg = std::string(e.what(), maxTraceLen); 159 trace<level::INFO>(traceMsg.c_str()); 160 } 161 } 162 } 163 164 /** 165 * Create FFDCFile objects containing debug data to store in the error log. 166 * 167 * If an error occurs, the error is written to the journal but an exception 168 * is not thrown. 169 * 170 * @param i_buffer - raw data (if creating raw dump ffdc entry in log) 171 * @return vector of FFDCFile objects 172 */ 173 std::vector<util::FFDCFile> createFFDCFiles(char* i_buffer = nullptr, 174 size_t i_size = 0) 175 { 176 std::vector<util::FFDCFile> files{}; 177 178 // Create raw dump file 179 if ((nullptr != i_buffer) && (0 != i_size)) 180 { 181 files.emplace_back(createFFDCRawFile(i_buffer, i_size)); 182 } 183 184 // Create trace dump file 185 createFFDCTraceFiles(files); 186 187 return files; 188 } 189 190 /** 191 * Create a PEL from an existing PEL 192 * 193 * Create a new PEL based on the specified raw PEL and submit the new PEL 194 * to the backend logging code as a raw PEL. Note that additional data map 195 * here contains data to be committed to the PEL and it can also be used to 196 * create the PEL as it contains needed information. 197 * 198 * @param i_buffer - buffer containing a raw PEL 199 * @param i_additional - additional data to be added to the new PEL 200 */ 201 void createPelCustom(std::vector<uint8_t>& i_rawPel, 202 std::map<std::string, std::string> i_additional) 203 { 204 // create PEL object from buffer 205 auto tiPel = std::make_unique<pel::PelMinimal>(i_rawPel); 206 207 // The additional data contains the TI info as well as the value for the 208 // subystem that provided the TI info. Get the subystem from additional 209 // data and then populate the prmary SRC and SRC words for the custom PEL 210 // based on the sybsystem's TI info. 211 uint8_t subsystem = std::stoi(i_additional["Subsystem"]); 212 tiPel->setSubsystem(subsystem); 213 214 if (static_cast<uint8_t>(pel::SubsystemID::hypervisor) == subsystem) 215 { 216 // populate hypervisor SRC words 217 tiPel->setSrcWords(std::array<uint32_t, pel::numSrcWords>{ 218 (uint32_t)std::stoul(i_additional["0x10 SRC Word 12"], 0, 16), 219 (uint32_t)std::stoul(i_additional["0x14 SRC Word 13"], 0, 16), 220 (uint32_t)std::stoul(i_additional["0x18 SRC Word 14"], 0, 16), 221 (uint32_t)std::stoul(i_additional["0x1c SRC Word 15"], 0, 16), 222 (uint32_t)std::stoul(i_additional["0x20 SRC Word 16"], 0, 16), 223 (uint32_t)std::stoul(i_additional["0x24 SRC Word 17"], 0, 16), 224 (uint32_t)std::stoul(i_additional["0x28 SRC Word 18"], 0, 16), 225 (uint32_t)std::stoul(i_additional["0x2c SRC Word 19"], 0, 16)}); 226 227 // Populate phyp primary SRC 228 229 // char array for raw pel src 230 std::array<char, pel::asciiStringSize> srcChars{'0'}; 231 232 // src from TI info 233 std::string srcString = i_additional["SrcAscii"]; 234 235 // copy from string to char array 236 srcString.copy(srcChars.data(), 237 std::min(srcString.size(), pel::asciiStringSize), 0); 238 239 tiPel->setAsciiString(srcChars); // pel object src is char array 240 241 // set symptom-id 242 auto symptomId = (i_additional["SrcAscii"].substr(0, 8) + '_'); 243 244 symptomId += (i_additional["0x10 SRC Word 12"]); 245 symptomId += (i_additional["0x14 SRC Word 13"] + '_'); 246 symptomId += (i_additional["0x18 SRC Word 14"]); 247 symptomId += (i_additional["0x1c SRC Word 15"] + '_'); 248 symptomId += (i_additional["0x20 SRC Word 16"]); 249 symptomId += (i_additional["0x24 SRC Word 17"] + '_'); 250 symptomId += (i_additional["0x28 SRC Word 18"]); 251 symptomId += (i_additional["0x2c SRC Word 19"]); 252 253 // setSymptomId will take care of required null-terminate and padding 254 tiPel->setSymptomId(symptomId); 255 } 256 else 257 { 258 // Populate hostboot SRC words - note HB word 0 from the shared info 259 // data (additional data "0x10 HB Word") is reflected in the PEL as 260 // "reason code" so we zero it here. Also note that the first word 261 // in this group of words starts at word 0 and word 1 does not exits. 262 tiPel->setSrcWords(std::array<uint32_t, pel::numSrcWords>{ 263 (uint32_t)0x00000000, 264 (uint32_t)std::stoul(i_additional["0x14 HB Word 2"], 0, 16), 265 (uint32_t)std::stoul(i_additional["0x18 HB Word 3"], 0, 16), 266 (uint32_t)std::stoul(i_additional["0x1c HB Word 4"], 0, 16), 267 (uint32_t)std::stoul(i_additional["0x20 HB Word 5"], 0, 16), 268 (uint32_t)std::stoul(i_additional["0x24 HB Word 6"], 0, 16), 269 (uint32_t)std::stoul(i_additional["0x28 HB Word 7"], 0, 16), 270 (uint32_t)std::stoul(i_additional["0x2c HB Word 8"], 0, 16)}); 271 272 // Populate hostboot primary SRC 273 274 // char array for raw pel src 275 std::array<char, pel::asciiStringSize> srcChars{'0'}; 276 277 // src from TI info 278 std::string srcString = i_additional["SrcAscii"]; 279 280 // copy from string to char array 281 srcString.copy(srcChars.data(), 282 std::min(srcString.size(), pel::asciiStringSize), 0); 283 284 tiPel->setAsciiString(srcChars); // pel object src is char array 285 286 // set symptom-id 287 auto symptomId = (i_additional["SrcAscii"].substr(0, 8) + '_'); 288 289 symptomId += (i_additional["0x10 HB Word 0"]); // note: word 1 290 symptomId += (i_additional["0x14 HB Word 2"] + '_'); // does not exist 291 symptomId += (i_additional["0x18 HB Word 3"]); 292 symptomId += (i_additional["0x1c HB Word 4"] + '_'); 293 symptomId += (i_additional["0x20 HB Word 5"]); 294 symptomId += (i_additional["0x24 HB Word 6"] + '_'); 295 symptomId += (i_additional["0x28 HB Word 7"]); 296 symptomId += (i_additional["0x2c HB Word 8"]); 297 298 // setSymptomId will take care of required null-terminate and padding 299 tiPel->setSymptomId(symptomId); 300 } 301 302 // set severity, event type and action flags 303 tiPel->setSeverity(static_cast<uint8_t>(pel::Severity::termination)); 304 tiPel->setType(static_cast<uint8_t>(pel::EventType::na)); 305 tiPel->setAction(static_cast<uint16_t>(pel::ActionFlags::service | 306 pel::ActionFlags::report | 307 pel::ActionFlags::call)); 308 309 // The raw PEL that we used as the basis for this custom PEL contains the 310 // attention handler trace data and does not needed to be in this PEL so 311 // we remove it here. 312 tiPel->setSectionCount(tiPel->getSectionCount() - 1); 313 314 // Update the raw PEL with the new custom PEL data 315 tiPel->raw(i_rawPel); 316 317 // create PEL from raw data 318 createPelRaw(i_rawPel); 319 } 320 321 /** 322 * Log an event handled by the attention handler 323 * 324 * Basic (non TI) events will generate a standard message-registry based PEL 325 * 326 * TI events will create two PEL's. One PEL will be informational and will 327 * contain trace information relevent to attention handler. The second PEL 328 * will be specific to the TI type (including the primary SRC) and will be 329 * based off of the TI information provided to the attention handler through 330 * shared TI info data area. 331 * 332 * @param i_event - The event type 333 * @param i_additional - Additional PEL data 334 * @param i_ffdc - FFDC PEL data 335 */ 336 void event(EventType i_event, std::map<std::string, std::string>& i_additional, 337 const std::vector<util::FFDCFile>& i_ffdc) 338 { 339 bool eventValid = false; // assume no event created 340 bool tiEvent = false; // assume not a terminate event 341 342 std::string eventName; 343 344 switch (i_event) 345 { 346 case EventType::Checkstop: 347 eventName = "org.open_power.HwDiags.Error.Checkstop"; 348 eventValid = true; 349 break; 350 case EventType::Terminate: 351 eventName = "org.open_power.Attn.Error.Terminate"; 352 eventValid = true; 353 tiEvent = true; 354 break; 355 case EventType::Vital: 356 eventName = "org.open_power.Attn.Error.Vital"; 357 eventValid = true; 358 break; 359 case EventType::HwDiagsFail: 360 case EventType::AttentionFail: 361 eventName = "org.open_power.Attn.Error.Fail"; 362 eventValid = true; 363 break; 364 default: 365 eventValid = false; 366 break; 367 } 368 369 if (true == eventValid) 370 { 371 // Create PEL with additional data and FFDC data. The newly created 372 // PEL's platform log-id will be returned. 373 auto pelId = 374 createPel(eventName, i_additional, createFFDCTuples(i_ffdc)); 375 376 // If this is a TI event we will create an additional PEL that is 377 // specific to the subsystem that generated the TI. 378 if ((true == tiEvent) && (0 != pelId)) 379 { 380 // get file descriptor and size of information PEL 381 int pelFd = getPel(pelId); 382 383 // if PEL found, read into buffer 384 if (-1 != pelFd) 385 { 386 auto pelSize = lseek(pelFd, 0, SEEK_END); 387 lseek(pelFd, 0, SEEK_SET); 388 389 // read information PEL into buffer 390 std::vector<uint8_t> buffer(pelSize); 391 size_t numBytes = read(pelFd, buffer.data(), buffer.size()); 392 if (buffer.size() != numBytes) 393 { 394 std::stringstream traceMsg; 395 traceMsg << "Error reading event log: " << (int)numBytes 396 << " of " << (int)buffer.size() << " bytes read"; 397 auto strobj = traceMsg.str(); 398 trace<level::ERROR>(strobj.c_str()); 399 } 400 else 401 { 402 // create PEL from buffer 403 createPelCustom(buffer, i_additional); 404 } 405 406 close(pelFd); 407 } 408 409 uint8_t subsystem = std::stoi(i_additional["Subsystem"]); 410 411 // If not hypervisor TI 412 if (static_cast<uint8_t>(pel::SubsystemID::hypervisor) != subsystem) 413 { 414 // Request a dump and transition the host 415 if ("true" == i_additional["Dump"]) 416 { 417 // will not return until dump is complete 418 requestDump(pelId); 419 } 420 } 421 } 422 } 423 } 424 425 /** 426 * Commit special attention TI event to log 427 * 428 * Create a event log with provided additional information and standard 429 * FFDC data plus TI FFDC data 430 * 431 * @param i_additional - Additional log data 432 * @param i_ti_InfoData - TI FFDC data 433 */ 434 void eventTerminate(std::map<std::string, std::string> i_additionalData, 435 char* i_tiInfoData) 436 { 437 438 uint32_t tiInfoSize = 0; // assume TI info was not available 439 440 if (nullptr != i_tiInfoData) 441 { 442 tiInfoSize = 56; // assume not hypervisor TI 443 444 uint8_t subsystem = std::stoi(i_additionalData["Subsystem"]); 445 446 // If hypervisor 447 if (static_cast<uint8_t>(pel::SubsystemID::hypervisor) == subsystem) 448 { 449 tiInfoSize = 1024; // assume hypervisor max 450 451 // hypervisor may just want some of the data 452 if (0 == (*(i_tiInfoData + 0x09) & 0x01)) 453 { 454 uint32_t* additionalLength = (uint32_t*)(i_tiInfoData + 0x50); 455 uint32_t tiAdditional = be32toh(*additionalLength); 456 tiInfoSize = std::min(tiInfoSize, (84 + tiAdditional)); 457 } 458 } 459 } 460 461 std::string traceMsg = "TI info size = " + std::to_string(tiInfoSize); 462 trace<level::INFO>(traceMsg.c_str()); 463 464 event(EventType::Terminate, i_additionalData, 465 createFFDCFiles(i_tiInfoData, tiInfoSize)); 466 } 467 468 /** @brief Commit SBE vital event to log */ 469 void eventVital() 470 { 471 // Additional data for log 472 std::map<std::string, std::string> additionalData; 473 474 // Create log event with additional data and FFDC data 475 event(EventType::Vital, additionalData, createFFDCFiles(nullptr, 0)); 476 } 477 478 /** 479 * Commit attention handler failure event to log 480 * 481 * Create an event log containing the specified error code. 482 * 483 * @param i_error - Error code 484 */ 485 void eventAttentionFail(int i_error) 486 { 487 // Additional data for log 488 std::map<std::string, std::string> additionalData; 489 additionalData["ERROR_CODE"] = std::to_string(i_error); 490 491 // Create log event with additional data and FFDC data 492 event(EventType::AttentionFail, additionalData, 493 createFFDCFiles(nullptr, 0)); 494 } 495 496 /** 497 * Parse systemd journal message field 498 * 499 * Parse the journal looking for the specified field and return the journal 500 * data for that field. 501 * 502 * @param journal - The journal to parse 503 * @param field - Field containing the data to retrieve 504 * @return Data for the speciefied field 505 */ 506 std::string sdjGetFieldValue(sd_journal* journal, const char* field) 507 { 508 const char* data{nullptr}; 509 size_t length{0}; 510 511 // get field value 512 if (0 == sd_journal_get_data(journal, field, (const void**)&data, &length)) 513 { 514 size_t prefix{0}; 515 516 // The data returned by sd_journal_get_data will be prefixed with the 517 // field name and "=" 518 const void* eq = memchr(data, '=', length); 519 if (nullptr != eq) 520 { 521 // get just data following the "=" 522 prefix = (const char*)eq - data + 1; 523 } 524 else 525 { 526 // all the data (should not happen) 527 prefix = 0; 528 std::string value{}; // empty string 529 } 530 531 return std::string{data + prefix, length - prefix}; 532 } 533 else 534 { 535 return std::string{}; // empty string 536 } 537 } 538 539 /** 540 * Gather messages from the journal 541 * 542 * Fetch journal entry data for all entries with the specified field equal to 543 * the specified value. 544 * 545 * @param field - Field to search on 546 * @param fieldValue - Value to search for 547 * @param max - Maximum number of messages fetch 548 * @return Vector of journal entry data 549 */ 550 std::vector<std::string> sdjGetMessages(const std::string& field, 551 const std::string& fieldValue, 552 unsigned int max) 553 { 554 sd_journal* journal; 555 std::vector<std::string> messages; 556 557 if (0 == sd_journal_open(&journal, SD_JOURNAL_LOCAL_ONLY)) 558 { 559 SD_JOURNAL_FOREACH_BACKWARDS(journal) 560 { 561 // Get input field 562 std::string value = sdjGetFieldValue(journal, field.c_str()); 563 564 // Compare field value and read data 565 if (value == fieldValue) 566 { 567 // Get SYSLOG_IDENTIFIER field (process that logged message) 568 std::string syslog = 569 sdjGetFieldValue(journal, "SYSLOG_IDENTIFIER"); 570 571 // Get _PID field 572 std::string pid = sdjGetFieldValue(journal, "_PID"); 573 574 // Get MESSAGE field 575 std::string message = sdjGetFieldValue(journal, "MESSAGE"); 576 577 // Get timestamp 578 uint64_t usec{0}; 579 if (0 == sd_journal_get_realtime_usec(journal, &usec)) 580 { 581 582 // Convert realtime microseconds to date format 583 char dateBuffer[80]; 584 std::string date; 585 std::time_t timeInSecs = usec / 1000000; 586 strftime(dateBuffer, sizeof(dateBuffer), "%b %d %H:%M:%S", 587 std::localtime(&timeInSecs)); 588 date = dateBuffer; 589 590 // Store value to messages 591 value = date + " " + syslog + "[" + pid + "]: " + message; 592 messages.insert(messages.begin(), value); 593 } 594 } 595 596 // limit maximum number of messages 597 if (messages.size() >= max) 598 { 599 break; 600 } 601 } 602 603 sd_journal_close(journal); // close journal when done 604 } 605 606 return messages; 607 } 608 609 } // namespace attn 610