1 // SPDX-License-Identifier: GPL-2.0-only 2 /* 3 * Mediated virtual PCI serial host device driver 4 * 5 * Copyright (c) 2016, NVIDIA CORPORATION. All rights reserved. 6 * Author: Neo Jia <cjia@nvidia.com> 7 * Kirti Wankhede <kwankhede@nvidia.com> 8 * 9 * Sample driver that creates mdev device that simulates serial port over PCI 10 * card. 11 */ 12 13 #include <linux/init.h> 14 #include <linux/module.h> 15 #include <linux/kernel.h> 16 #include <linux/fs.h> 17 #include <linux/poll.h> 18 #include <linux/slab.h> 19 #include <linux/cdev.h> 20 #include <linux/sched.h> 21 #include <linux/wait.h> 22 #include <linux/vfio.h> 23 #include <linux/iommu.h> 24 #include <linux/sysfs.h> 25 #include <linux/ctype.h> 26 #include <linux/file.h> 27 #include <linux/mdev.h> 28 #include <linux/pci.h> 29 #include <linux/serial.h> 30 #include <uapi/linux/serial_reg.h> 31 #include <linux/eventfd.h> 32 /* 33 * #defines 34 */ 35 36 #define VERSION_STRING "0.1" 37 #define DRIVER_AUTHOR "NVIDIA Corporation" 38 39 #define MTTY_CLASS_NAME "mtty" 40 41 #define MTTY_NAME "mtty" 42 43 #define MTTY_STRING_LEN 16 44 45 #define MTTY_CONFIG_SPACE_SIZE 0xff 46 #define MTTY_IO_BAR_SIZE 0x8 47 #define MTTY_MMIO_BAR_SIZE 0x100000 48 49 #define STORE_LE16(addr, val) (*(u16 *)addr = val) 50 #define STORE_LE32(addr, val) (*(u32 *)addr = val) 51 52 #define MAX_FIFO_SIZE 16 53 54 #define CIRCULAR_BUF_INC_IDX(idx) (idx = (idx + 1) & (MAX_FIFO_SIZE - 1)) 55 56 #define MTTY_VFIO_PCI_OFFSET_SHIFT 40 57 58 #define MTTY_VFIO_PCI_OFFSET_TO_INDEX(off) (off >> MTTY_VFIO_PCI_OFFSET_SHIFT) 59 #define MTTY_VFIO_PCI_INDEX_TO_OFFSET(index) \ 60 ((u64)(index) << MTTY_VFIO_PCI_OFFSET_SHIFT) 61 #define MTTY_VFIO_PCI_OFFSET_MASK \ 62 (((u64)(1) << MTTY_VFIO_PCI_OFFSET_SHIFT) - 1) 63 #define MAX_MTTYS 24 64 65 /* 66 * Global Structures 67 */ 68 69 static struct mtty_dev { 70 dev_t vd_devt; 71 struct class *vd_class; 72 struct cdev vd_cdev; 73 struct idr vd_idr; 74 struct device dev; 75 struct mdev_parent parent; 76 } mtty_dev; 77 78 struct mdev_region_info { 79 u64 start; 80 u64 phys_start; 81 u32 size; 82 u64 vfio_offset; 83 }; 84 85 #if defined(DEBUG_REGS) 86 static const char *wr_reg[] = { 87 "TX", 88 "IER", 89 "FCR", 90 "LCR", 91 "MCR", 92 "LSR", 93 "MSR", 94 "SCR" 95 }; 96 97 static const char *rd_reg[] = { 98 "RX", 99 "IER", 100 "IIR", 101 "LCR", 102 "MCR", 103 "LSR", 104 "MSR", 105 "SCR" 106 }; 107 #endif 108 109 /* loop back buffer */ 110 struct rxtx { 111 u8 fifo[MAX_FIFO_SIZE]; 112 u8 head, tail; 113 u8 count; 114 }; 115 116 struct serial_port { 117 u8 uart_reg[8]; /* 8 registers */ 118 struct rxtx rxtx; /* loop back buffer */ 119 bool dlab; 120 bool overrun; 121 u16 divisor; 122 u8 fcr; /* FIFO control register */ 123 u8 max_fifo_size; 124 u8 intr_trigger_level; /* interrupt trigger level */ 125 }; 126 127 /* State of each mdev device */ 128 struct mdev_state { 129 struct vfio_device vdev; 130 int irq_fd; 131 struct eventfd_ctx *intx_evtfd; 132 struct eventfd_ctx *msi_evtfd; 133 int irq_index; 134 u8 *vconfig; 135 struct mutex ops_lock; 136 struct mdev_device *mdev; 137 struct mdev_region_info region_info[VFIO_PCI_NUM_REGIONS]; 138 u32 bar_mask[VFIO_PCI_NUM_REGIONS]; 139 struct list_head next; 140 struct serial_port s[2]; 141 struct mutex rxtx_lock; 142 struct vfio_device_info dev_info; 143 int nr_ports; 144 }; 145 146 static struct mtty_type { 147 struct mdev_type type; 148 int nr_ports; 149 const char *name; 150 } mtty_types[2] = { 151 { .nr_ports = 1, .type.sysfs_name = "1", .name = "Single port serial" }, 152 { .nr_ports = 2, .type.sysfs_name = "2", .name = "Dual port serial" }, 153 }; 154 155 static struct mdev_type *mtty_mdev_types[] = { 156 &mtty_types[0].type, 157 &mtty_types[1].type, 158 }; 159 160 static atomic_t mdev_avail_ports = ATOMIC_INIT(MAX_MTTYS); 161 162 static const struct file_operations vd_fops = { 163 .owner = THIS_MODULE, 164 }; 165 166 static const struct vfio_device_ops mtty_dev_ops; 167 168 /* function prototypes */ 169 170 static int mtty_trigger_interrupt(struct mdev_state *mdev_state); 171 172 /* Helper functions */ 173 174 static void dump_buffer(u8 *buf, uint32_t count) 175 { 176 #if defined(DEBUG) 177 int i; 178 179 pr_info("Buffer:\n"); 180 for (i = 0; i < count; i++) { 181 pr_info("%2x ", *(buf + i)); 182 if ((i + 1) % 16 == 0) 183 pr_info("\n"); 184 } 185 #endif 186 } 187 188 static void mtty_create_config_space(struct mdev_state *mdev_state) 189 { 190 /* PCI dev ID */ 191 STORE_LE32((u32 *) &mdev_state->vconfig[0x0], 0x32534348); 192 193 /* Control: I/O+, Mem-, BusMaster- */ 194 STORE_LE16((u16 *) &mdev_state->vconfig[0x4], 0x0001); 195 196 /* Status: capabilities list absent */ 197 STORE_LE16((u16 *) &mdev_state->vconfig[0x6], 0x0200); 198 199 /* Rev ID */ 200 mdev_state->vconfig[0x8] = 0x10; 201 202 /* programming interface class : 16550-compatible serial controller */ 203 mdev_state->vconfig[0x9] = 0x02; 204 205 /* Sub class : 00 */ 206 mdev_state->vconfig[0xa] = 0x00; 207 208 /* Base class : Simple Communication controllers */ 209 mdev_state->vconfig[0xb] = 0x07; 210 211 /* base address registers */ 212 /* BAR0: IO space */ 213 STORE_LE32((u32 *) &mdev_state->vconfig[0x10], 0x000001); 214 mdev_state->bar_mask[0] = ~(MTTY_IO_BAR_SIZE) + 1; 215 216 if (mdev_state->nr_ports == 2) { 217 /* BAR1: IO space */ 218 STORE_LE32((u32 *) &mdev_state->vconfig[0x14], 0x000001); 219 mdev_state->bar_mask[1] = ~(MTTY_IO_BAR_SIZE) + 1; 220 } 221 222 /* Subsystem ID */ 223 STORE_LE32((u32 *) &mdev_state->vconfig[0x2c], 0x32534348); 224 225 mdev_state->vconfig[0x34] = 0x00; /* Cap Ptr */ 226 mdev_state->vconfig[0x3d] = 0x01; /* interrupt pin (INTA#) */ 227 228 /* Vendor specific data */ 229 mdev_state->vconfig[0x40] = 0x23; 230 mdev_state->vconfig[0x43] = 0x80; 231 mdev_state->vconfig[0x44] = 0x23; 232 mdev_state->vconfig[0x48] = 0x23; 233 mdev_state->vconfig[0x4c] = 0x23; 234 235 mdev_state->vconfig[0x60] = 0x50; 236 mdev_state->vconfig[0x61] = 0x43; 237 mdev_state->vconfig[0x62] = 0x49; 238 mdev_state->vconfig[0x63] = 0x20; 239 mdev_state->vconfig[0x64] = 0x53; 240 mdev_state->vconfig[0x65] = 0x65; 241 mdev_state->vconfig[0x66] = 0x72; 242 mdev_state->vconfig[0x67] = 0x69; 243 mdev_state->vconfig[0x68] = 0x61; 244 mdev_state->vconfig[0x69] = 0x6c; 245 mdev_state->vconfig[0x6a] = 0x2f; 246 mdev_state->vconfig[0x6b] = 0x55; 247 mdev_state->vconfig[0x6c] = 0x41; 248 mdev_state->vconfig[0x6d] = 0x52; 249 mdev_state->vconfig[0x6e] = 0x54; 250 } 251 252 static void handle_pci_cfg_write(struct mdev_state *mdev_state, u16 offset, 253 u8 *buf, u32 count) 254 { 255 u32 cfg_addr, bar_mask, bar_index = 0; 256 257 switch (offset) { 258 case 0x04: /* device control */ 259 case 0x06: /* device status */ 260 /* do nothing */ 261 break; 262 case 0x3c: /* interrupt line */ 263 mdev_state->vconfig[0x3c] = buf[0]; 264 break; 265 case 0x3d: 266 /* 267 * Interrupt Pin is hardwired to INTA. 268 * This field is write protected by hardware 269 */ 270 break; 271 case 0x10: /* BAR0 */ 272 case 0x14: /* BAR1 */ 273 if (offset == 0x10) 274 bar_index = 0; 275 else if (offset == 0x14) 276 bar_index = 1; 277 278 if ((mdev_state->nr_ports == 1) && (bar_index == 1)) { 279 STORE_LE32(&mdev_state->vconfig[offset], 0); 280 break; 281 } 282 283 cfg_addr = *(u32 *)buf; 284 pr_info("BAR%d addr 0x%x\n", bar_index, cfg_addr); 285 286 if (cfg_addr == 0xffffffff) { 287 bar_mask = mdev_state->bar_mask[bar_index]; 288 cfg_addr = (cfg_addr & bar_mask); 289 } 290 291 cfg_addr |= (mdev_state->vconfig[offset] & 0x3ul); 292 STORE_LE32(&mdev_state->vconfig[offset], cfg_addr); 293 break; 294 case 0x18: /* BAR2 */ 295 case 0x1c: /* BAR3 */ 296 case 0x20: /* BAR4 */ 297 STORE_LE32(&mdev_state->vconfig[offset], 0); 298 break; 299 default: 300 pr_info("PCI config write @0x%x of %d bytes not handled\n", 301 offset, count); 302 break; 303 } 304 } 305 306 static void handle_bar_write(unsigned int index, struct mdev_state *mdev_state, 307 u16 offset, u8 *buf, u32 count) 308 { 309 u8 data = *buf; 310 311 /* Handle data written by guest */ 312 switch (offset) { 313 case UART_TX: 314 /* if DLAB set, data is LSB of divisor */ 315 if (mdev_state->s[index].dlab) { 316 mdev_state->s[index].divisor |= data; 317 break; 318 } 319 320 mutex_lock(&mdev_state->rxtx_lock); 321 322 /* save in TX buffer */ 323 if (mdev_state->s[index].rxtx.count < 324 mdev_state->s[index].max_fifo_size) { 325 mdev_state->s[index].rxtx.fifo[ 326 mdev_state->s[index].rxtx.head] = data; 327 mdev_state->s[index].rxtx.count++; 328 CIRCULAR_BUF_INC_IDX(mdev_state->s[index].rxtx.head); 329 mdev_state->s[index].overrun = false; 330 331 /* 332 * Trigger interrupt if receive data interrupt is 333 * enabled and fifo reached trigger level 334 */ 335 if ((mdev_state->s[index].uart_reg[UART_IER] & 336 UART_IER_RDI) && 337 (mdev_state->s[index].rxtx.count == 338 mdev_state->s[index].intr_trigger_level)) { 339 /* trigger interrupt */ 340 #if defined(DEBUG_INTR) 341 pr_err("Serial port %d: Fifo level trigger\n", 342 index); 343 #endif 344 mtty_trigger_interrupt(mdev_state); 345 } 346 } else { 347 #if defined(DEBUG_INTR) 348 pr_err("Serial port %d: Buffer Overflow\n", index); 349 #endif 350 mdev_state->s[index].overrun = true; 351 352 /* 353 * Trigger interrupt if receiver line status interrupt 354 * is enabled 355 */ 356 if (mdev_state->s[index].uart_reg[UART_IER] & 357 UART_IER_RLSI) 358 mtty_trigger_interrupt(mdev_state); 359 } 360 mutex_unlock(&mdev_state->rxtx_lock); 361 break; 362 363 case UART_IER: 364 /* if DLAB set, data is MSB of divisor */ 365 if (mdev_state->s[index].dlab) 366 mdev_state->s[index].divisor |= (u16)data << 8; 367 else { 368 mdev_state->s[index].uart_reg[offset] = data; 369 mutex_lock(&mdev_state->rxtx_lock); 370 if ((data & UART_IER_THRI) && 371 (mdev_state->s[index].rxtx.head == 372 mdev_state->s[index].rxtx.tail)) { 373 #if defined(DEBUG_INTR) 374 pr_err("Serial port %d: IER_THRI write\n", 375 index); 376 #endif 377 mtty_trigger_interrupt(mdev_state); 378 } 379 380 mutex_unlock(&mdev_state->rxtx_lock); 381 } 382 383 break; 384 385 case UART_FCR: 386 mdev_state->s[index].fcr = data; 387 388 mutex_lock(&mdev_state->rxtx_lock); 389 if (data & (UART_FCR_CLEAR_RCVR | UART_FCR_CLEAR_XMIT)) { 390 /* clear loop back FIFO */ 391 mdev_state->s[index].rxtx.count = 0; 392 mdev_state->s[index].rxtx.head = 0; 393 mdev_state->s[index].rxtx.tail = 0; 394 } 395 mutex_unlock(&mdev_state->rxtx_lock); 396 397 switch (data & UART_FCR_TRIGGER_MASK) { 398 case UART_FCR_TRIGGER_1: 399 mdev_state->s[index].intr_trigger_level = 1; 400 break; 401 402 case UART_FCR_TRIGGER_4: 403 mdev_state->s[index].intr_trigger_level = 4; 404 break; 405 406 case UART_FCR_TRIGGER_8: 407 mdev_state->s[index].intr_trigger_level = 8; 408 break; 409 410 case UART_FCR_TRIGGER_14: 411 mdev_state->s[index].intr_trigger_level = 14; 412 break; 413 } 414 415 /* 416 * Set trigger level to 1 otherwise or implement timer with 417 * timeout of 4 characters and on expiring that timer set 418 * Recevice data timeout in IIR register 419 */ 420 mdev_state->s[index].intr_trigger_level = 1; 421 if (data & UART_FCR_ENABLE_FIFO) 422 mdev_state->s[index].max_fifo_size = MAX_FIFO_SIZE; 423 else { 424 mdev_state->s[index].max_fifo_size = 1; 425 mdev_state->s[index].intr_trigger_level = 1; 426 } 427 428 break; 429 430 case UART_LCR: 431 if (data & UART_LCR_DLAB) { 432 mdev_state->s[index].dlab = true; 433 mdev_state->s[index].divisor = 0; 434 } else 435 mdev_state->s[index].dlab = false; 436 437 mdev_state->s[index].uart_reg[offset] = data; 438 break; 439 440 case UART_MCR: 441 mdev_state->s[index].uart_reg[offset] = data; 442 443 if ((mdev_state->s[index].uart_reg[UART_IER] & UART_IER_MSI) && 444 (data & UART_MCR_OUT2)) { 445 #if defined(DEBUG_INTR) 446 pr_err("Serial port %d: MCR_OUT2 write\n", index); 447 #endif 448 mtty_trigger_interrupt(mdev_state); 449 } 450 451 if ((mdev_state->s[index].uart_reg[UART_IER] & UART_IER_MSI) && 452 (data & (UART_MCR_RTS | UART_MCR_DTR))) { 453 #if defined(DEBUG_INTR) 454 pr_err("Serial port %d: MCR RTS/DTR write\n", index); 455 #endif 456 mtty_trigger_interrupt(mdev_state); 457 } 458 break; 459 460 case UART_LSR: 461 case UART_MSR: 462 /* do nothing */ 463 break; 464 465 case UART_SCR: 466 mdev_state->s[index].uart_reg[offset] = data; 467 break; 468 469 default: 470 break; 471 } 472 } 473 474 static void handle_bar_read(unsigned int index, struct mdev_state *mdev_state, 475 u16 offset, u8 *buf, u32 count) 476 { 477 /* Handle read requests by guest */ 478 switch (offset) { 479 case UART_RX: 480 /* if DLAB set, data is LSB of divisor */ 481 if (mdev_state->s[index].dlab) { 482 *buf = (u8)mdev_state->s[index].divisor; 483 break; 484 } 485 486 mutex_lock(&mdev_state->rxtx_lock); 487 /* return data in tx buffer */ 488 if (mdev_state->s[index].rxtx.head != 489 mdev_state->s[index].rxtx.tail) { 490 *buf = mdev_state->s[index].rxtx.fifo[ 491 mdev_state->s[index].rxtx.tail]; 492 mdev_state->s[index].rxtx.count--; 493 CIRCULAR_BUF_INC_IDX(mdev_state->s[index].rxtx.tail); 494 } 495 496 if (mdev_state->s[index].rxtx.head == 497 mdev_state->s[index].rxtx.tail) { 498 /* 499 * Trigger interrupt if tx buffer empty interrupt is 500 * enabled and fifo is empty 501 */ 502 #if defined(DEBUG_INTR) 503 pr_err("Serial port %d: Buffer Empty\n", index); 504 #endif 505 if (mdev_state->s[index].uart_reg[UART_IER] & 506 UART_IER_THRI) 507 mtty_trigger_interrupt(mdev_state); 508 } 509 mutex_unlock(&mdev_state->rxtx_lock); 510 511 break; 512 513 case UART_IER: 514 if (mdev_state->s[index].dlab) { 515 *buf = (u8)(mdev_state->s[index].divisor >> 8); 516 break; 517 } 518 *buf = mdev_state->s[index].uart_reg[offset] & 0x0f; 519 break; 520 521 case UART_IIR: 522 { 523 u8 ier = mdev_state->s[index].uart_reg[UART_IER]; 524 *buf = 0; 525 526 mutex_lock(&mdev_state->rxtx_lock); 527 /* Interrupt priority 1: Parity, overrun, framing or break */ 528 if ((ier & UART_IER_RLSI) && mdev_state->s[index].overrun) 529 *buf |= UART_IIR_RLSI; 530 531 /* Interrupt priority 2: Fifo trigger level reached */ 532 if ((ier & UART_IER_RDI) && 533 (mdev_state->s[index].rxtx.count >= 534 mdev_state->s[index].intr_trigger_level)) 535 *buf |= UART_IIR_RDI; 536 537 /* Interrupt priotiry 3: transmitter holding register empty */ 538 if ((ier & UART_IER_THRI) && 539 (mdev_state->s[index].rxtx.head == 540 mdev_state->s[index].rxtx.tail)) 541 *buf |= UART_IIR_THRI; 542 543 /* Interrupt priotiry 4: Modem status: CTS, DSR, RI or DCD */ 544 if ((ier & UART_IER_MSI) && 545 (mdev_state->s[index].uart_reg[UART_MCR] & 546 (UART_MCR_RTS | UART_MCR_DTR))) 547 *buf |= UART_IIR_MSI; 548 549 /* bit0: 0=> interrupt pending, 1=> no interrupt is pending */ 550 if (*buf == 0) 551 *buf = UART_IIR_NO_INT; 552 553 /* set bit 6 & 7 to be 16550 compatible */ 554 *buf |= 0xC0; 555 mutex_unlock(&mdev_state->rxtx_lock); 556 } 557 break; 558 559 case UART_LCR: 560 case UART_MCR: 561 *buf = mdev_state->s[index].uart_reg[offset]; 562 break; 563 564 case UART_LSR: 565 { 566 u8 lsr = 0; 567 568 mutex_lock(&mdev_state->rxtx_lock); 569 /* atleast one char in FIFO */ 570 if (mdev_state->s[index].rxtx.head != 571 mdev_state->s[index].rxtx.tail) 572 lsr |= UART_LSR_DR; 573 574 /* if FIFO overrun */ 575 if (mdev_state->s[index].overrun) 576 lsr |= UART_LSR_OE; 577 578 /* transmit FIFO empty and tramsitter empty */ 579 if (mdev_state->s[index].rxtx.head == 580 mdev_state->s[index].rxtx.tail) 581 lsr |= UART_LSR_TEMT | UART_LSR_THRE; 582 583 mutex_unlock(&mdev_state->rxtx_lock); 584 *buf = lsr; 585 break; 586 } 587 case UART_MSR: 588 *buf = UART_MSR_DSR | UART_MSR_DDSR | UART_MSR_DCD; 589 590 mutex_lock(&mdev_state->rxtx_lock); 591 /* if AFE is 1 and FIFO have space, set CTS bit */ 592 if (mdev_state->s[index].uart_reg[UART_MCR] & 593 UART_MCR_AFE) { 594 if (mdev_state->s[index].rxtx.count < 595 mdev_state->s[index].max_fifo_size) 596 *buf |= UART_MSR_CTS | UART_MSR_DCTS; 597 } else 598 *buf |= UART_MSR_CTS | UART_MSR_DCTS; 599 mutex_unlock(&mdev_state->rxtx_lock); 600 601 break; 602 603 case UART_SCR: 604 *buf = mdev_state->s[index].uart_reg[offset]; 605 break; 606 607 default: 608 break; 609 } 610 } 611 612 static void mdev_read_base(struct mdev_state *mdev_state) 613 { 614 int index, pos; 615 u32 start_lo, start_hi; 616 u32 mem_type; 617 618 pos = PCI_BASE_ADDRESS_0; 619 620 for (index = 0; index <= VFIO_PCI_BAR5_REGION_INDEX; index++) { 621 622 if (!mdev_state->region_info[index].size) 623 continue; 624 625 start_lo = (*(u32 *)(mdev_state->vconfig + pos)) & 626 PCI_BASE_ADDRESS_MEM_MASK; 627 mem_type = (*(u32 *)(mdev_state->vconfig + pos)) & 628 PCI_BASE_ADDRESS_MEM_TYPE_MASK; 629 630 switch (mem_type) { 631 case PCI_BASE_ADDRESS_MEM_TYPE_64: 632 start_hi = (*(u32 *)(mdev_state->vconfig + pos + 4)); 633 pos += 4; 634 break; 635 case PCI_BASE_ADDRESS_MEM_TYPE_32: 636 case PCI_BASE_ADDRESS_MEM_TYPE_1M: 637 /* 1M mem BAR treated as 32-bit BAR */ 638 default: 639 /* mem unknown type treated as 32-bit BAR */ 640 start_hi = 0; 641 break; 642 } 643 pos += 4; 644 mdev_state->region_info[index].start = ((u64)start_hi << 32) | 645 start_lo; 646 } 647 } 648 649 static ssize_t mdev_access(struct mdev_state *mdev_state, u8 *buf, size_t count, 650 loff_t pos, bool is_write) 651 { 652 unsigned int index; 653 loff_t offset; 654 int ret = 0; 655 656 if (!buf) 657 return -EINVAL; 658 659 mutex_lock(&mdev_state->ops_lock); 660 661 index = MTTY_VFIO_PCI_OFFSET_TO_INDEX(pos); 662 offset = pos & MTTY_VFIO_PCI_OFFSET_MASK; 663 switch (index) { 664 case VFIO_PCI_CONFIG_REGION_INDEX: 665 666 #if defined(DEBUG) 667 pr_info("%s: PCI config space %s at offset 0x%llx\n", 668 __func__, is_write ? "write" : "read", offset); 669 #endif 670 if (is_write) { 671 dump_buffer(buf, count); 672 handle_pci_cfg_write(mdev_state, offset, buf, count); 673 } else { 674 memcpy(buf, (mdev_state->vconfig + offset), count); 675 dump_buffer(buf, count); 676 } 677 678 break; 679 680 case VFIO_PCI_BAR0_REGION_INDEX ... VFIO_PCI_BAR5_REGION_INDEX: 681 if (!mdev_state->region_info[index].start) 682 mdev_read_base(mdev_state); 683 684 if (is_write) { 685 dump_buffer(buf, count); 686 687 #if defined(DEBUG_REGS) 688 pr_info("%s: BAR%d WR @0x%llx %s val:0x%02x dlab:%d\n", 689 __func__, index, offset, wr_reg[offset], 690 *buf, mdev_state->s[index].dlab); 691 #endif 692 handle_bar_write(index, mdev_state, offset, buf, count); 693 } else { 694 handle_bar_read(index, mdev_state, offset, buf, count); 695 dump_buffer(buf, count); 696 697 #if defined(DEBUG_REGS) 698 pr_info("%s: BAR%d RD @0x%llx %s val:0x%02x dlab:%d\n", 699 __func__, index, offset, rd_reg[offset], 700 *buf, mdev_state->s[index].dlab); 701 #endif 702 } 703 break; 704 705 default: 706 ret = -1; 707 goto accessfailed; 708 } 709 710 ret = count; 711 712 713 accessfailed: 714 mutex_unlock(&mdev_state->ops_lock); 715 716 return ret; 717 } 718 719 static int mtty_init_dev(struct vfio_device *vdev) 720 { 721 struct mdev_state *mdev_state = 722 container_of(vdev, struct mdev_state, vdev); 723 struct mdev_device *mdev = to_mdev_device(vdev->dev); 724 struct mtty_type *type = 725 container_of(mdev->type, struct mtty_type, type); 726 int avail_ports = atomic_read(&mdev_avail_ports); 727 int ret; 728 729 do { 730 if (avail_ports < type->nr_ports) 731 return -ENOSPC; 732 } while (!atomic_try_cmpxchg(&mdev_avail_ports, 733 &avail_ports, 734 avail_ports - type->nr_ports)); 735 736 mdev_state->nr_ports = type->nr_ports; 737 mdev_state->irq_index = -1; 738 mdev_state->s[0].max_fifo_size = MAX_FIFO_SIZE; 739 mdev_state->s[1].max_fifo_size = MAX_FIFO_SIZE; 740 mutex_init(&mdev_state->rxtx_lock); 741 742 mdev_state->vconfig = kzalloc(MTTY_CONFIG_SPACE_SIZE, GFP_KERNEL); 743 if (!mdev_state->vconfig) { 744 ret = -ENOMEM; 745 goto err_nr_ports; 746 } 747 748 mutex_init(&mdev_state->ops_lock); 749 mdev_state->mdev = mdev; 750 mtty_create_config_space(mdev_state); 751 return 0; 752 753 err_nr_ports: 754 atomic_add(type->nr_ports, &mdev_avail_ports); 755 return ret; 756 } 757 758 static int mtty_probe(struct mdev_device *mdev) 759 { 760 struct mdev_state *mdev_state; 761 int ret; 762 763 mdev_state = vfio_alloc_device(mdev_state, vdev, &mdev->dev, 764 &mtty_dev_ops); 765 if (IS_ERR(mdev_state)) 766 return PTR_ERR(mdev_state); 767 768 ret = vfio_register_emulated_iommu_dev(&mdev_state->vdev); 769 if (ret) 770 goto err_put_vdev; 771 dev_set_drvdata(&mdev->dev, mdev_state); 772 return 0; 773 774 err_put_vdev: 775 vfio_put_device(&mdev_state->vdev); 776 return ret; 777 } 778 779 static void mtty_release_dev(struct vfio_device *vdev) 780 { 781 struct mdev_state *mdev_state = 782 container_of(vdev, struct mdev_state, vdev); 783 784 atomic_add(mdev_state->nr_ports, &mdev_avail_ports); 785 kfree(mdev_state->vconfig); 786 vfio_free_device(vdev); 787 } 788 789 static void mtty_remove(struct mdev_device *mdev) 790 { 791 struct mdev_state *mdev_state = dev_get_drvdata(&mdev->dev); 792 793 vfio_unregister_group_dev(&mdev_state->vdev); 794 vfio_put_device(&mdev_state->vdev); 795 } 796 797 static int mtty_reset(struct mdev_state *mdev_state) 798 { 799 pr_info("%s: called\n", __func__); 800 801 return 0; 802 } 803 804 static ssize_t mtty_read(struct vfio_device *vdev, char __user *buf, 805 size_t count, loff_t *ppos) 806 { 807 struct mdev_state *mdev_state = 808 container_of(vdev, struct mdev_state, vdev); 809 unsigned int done = 0; 810 int ret; 811 812 while (count) { 813 size_t filled; 814 815 if (count >= 4 && !(*ppos % 4)) { 816 u32 val; 817 818 ret = mdev_access(mdev_state, (u8 *)&val, sizeof(val), 819 *ppos, false); 820 if (ret <= 0) 821 goto read_err; 822 823 if (copy_to_user(buf, &val, sizeof(val))) 824 goto read_err; 825 826 filled = 4; 827 } else if (count >= 2 && !(*ppos % 2)) { 828 u16 val; 829 830 ret = mdev_access(mdev_state, (u8 *)&val, sizeof(val), 831 *ppos, false); 832 if (ret <= 0) 833 goto read_err; 834 835 if (copy_to_user(buf, &val, sizeof(val))) 836 goto read_err; 837 838 filled = 2; 839 } else { 840 u8 val; 841 842 ret = mdev_access(mdev_state, (u8 *)&val, sizeof(val), 843 *ppos, false); 844 if (ret <= 0) 845 goto read_err; 846 847 if (copy_to_user(buf, &val, sizeof(val))) 848 goto read_err; 849 850 filled = 1; 851 } 852 853 count -= filled; 854 done += filled; 855 *ppos += filled; 856 buf += filled; 857 } 858 859 return done; 860 861 read_err: 862 return -EFAULT; 863 } 864 865 static ssize_t mtty_write(struct vfio_device *vdev, const char __user *buf, 866 size_t count, loff_t *ppos) 867 { 868 struct mdev_state *mdev_state = 869 container_of(vdev, struct mdev_state, vdev); 870 unsigned int done = 0; 871 int ret; 872 873 while (count) { 874 size_t filled; 875 876 if (count >= 4 && !(*ppos % 4)) { 877 u32 val; 878 879 if (copy_from_user(&val, buf, sizeof(val))) 880 goto write_err; 881 882 ret = mdev_access(mdev_state, (u8 *)&val, sizeof(val), 883 *ppos, true); 884 if (ret <= 0) 885 goto write_err; 886 887 filled = 4; 888 } else if (count >= 2 && !(*ppos % 2)) { 889 u16 val; 890 891 if (copy_from_user(&val, buf, sizeof(val))) 892 goto write_err; 893 894 ret = mdev_access(mdev_state, (u8 *)&val, sizeof(val), 895 *ppos, true); 896 if (ret <= 0) 897 goto write_err; 898 899 filled = 2; 900 } else { 901 u8 val; 902 903 if (copy_from_user(&val, buf, sizeof(val))) 904 goto write_err; 905 906 ret = mdev_access(mdev_state, (u8 *)&val, sizeof(val), 907 *ppos, true); 908 if (ret <= 0) 909 goto write_err; 910 911 filled = 1; 912 } 913 count -= filled; 914 done += filled; 915 *ppos += filled; 916 buf += filled; 917 } 918 919 return done; 920 write_err: 921 return -EFAULT; 922 } 923 924 static int mtty_set_irqs(struct mdev_state *mdev_state, uint32_t flags, 925 unsigned int index, unsigned int start, 926 unsigned int count, void *data) 927 { 928 int ret = 0; 929 930 mutex_lock(&mdev_state->ops_lock); 931 switch (index) { 932 case VFIO_PCI_INTX_IRQ_INDEX: 933 switch (flags & VFIO_IRQ_SET_ACTION_TYPE_MASK) { 934 case VFIO_IRQ_SET_ACTION_MASK: 935 case VFIO_IRQ_SET_ACTION_UNMASK: 936 break; 937 case VFIO_IRQ_SET_ACTION_TRIGGER: 938 { 939 if (flags & VFIO_IRQ_SET_DATA_NONE) { 940 pr_info("%s: disable INTx\n", __func__); 941 if (mdev_state->intx_evtfd) 942 eventfd_ctx_put(mdev_state->intx_evtfd); 943 break; 944 } 945 946 if (flags & VFIO_IRQ_SET_DATA_EVENTFD) { 947 int fd = *(int *)data; 948 949 if (fd > 0) { 950 struct eventfd_ctx *evt; 951 952 evt = eventfd_ctx_fdget(fd); 953 if (IS_ERR(evt)) { 954 ret = PTR_ERR(evt); 955 break; 956 } 957 mdev_state->intx_evtfd = evt; 958 mdev_state->irq_fd = fd; 959 mdev_state->irq_index = index; 960 break; 961 } 962 } 963 break; 964 } 965 } 966 break; 967 case VFIO_PCI_MSI_IRQ_INDEX: 968 switch (flags & VFIO_IRQ_SET_ACTION_TYPE_MASK) { 969 case VFIO_IRQ_SET_ACTION_MASK: 970 case VFIO_IRQ_SET_ACTION_UNMASK: 971 break; 972 case VFIO_IRQ_SET_ACTION_TRIGGER: 973 if (flags & VFIO_IRQ_SET_DATA_NONE) { 974 if (mdev_state->msi_evtfd) 975 eventfd_ctx_put(mdev_state->msi_evtfd); 976 pr_info("%s: disable MSI\n", __func__); 977 mdev_state->irq_index = VFIO_PCI_INTX_IRQ_INDEX; 978 break; 979 } 980 if (flags & VFIO_IRQ_SET_DATA_EVENTFD) { 981 int fd = *(int *)data; 982 struct eventfd_ctx *evt; 983 984 if (fd <= 0) 985 break; 986 987 if (mdev_state->msi_evtfd) 988 break; 989 990 evt = eventfd_ctx_fdget(fd); 991 if (IS_ERR(evt)) { 992 ret = PTR_ERR(evt); 993 break; 994 } 995 mdev_state->msi_evtfd = evt; 996 mdev_state->irq_fd = fd; 997 mdev_state->irq_index = index; 998 } 999 break; 1000 } 1001 break; 1002 case VFIO_PCI_MSIX_IRQ_INDEX: 1003 pr_info("%s: MSIX_IRQ\n", __func__); 1004 break; 1005 case VFIO_PCI_ERR_IRQ_INDEX: 1006 pr_info("%s: ERR_IRQ\n", __func__); 1007 break; 1008 case VFIO_PCI_REQ_IRQ_INDEX: 1009 pr_info("%s: REQ_IRQ\n", __func__); 1010 break; 1011 } 1012 1013 mutex_unlock(&mdev_state->ops_lock); 1014 return ret; 1015 } 1016 1017 static int mtty_trigger_interrupt(struct mdev_state *mdev_state) 1018 { 1019 int ret = -1; 1020 1021 if ((mdev_state->irq_index == VFIO_PCI_MSI_IRQ_INDEX) && 1022 (!mdev_state->msi_evtfd)) 1023 return -EINVAL; 1024 else if ((mdev_state->irq_index == VFIO_PCI_INTX_IRQ_INDEX) && 1025 (!mdev_state->intx_evtfd)) { 1026 pr_info("%s: Intr eventfd not found\n", __func__); 1027 return -EINVAL; 1028 } 1029 1030 if (mdev_state->irq_index == VFIO_PCI_MSI_IRQ_INDEX) 1031 ret = eventfd_signal(mdev_state->msi_evtfd, 1); 1032 else 1033 ret = eventfd_signal(mdev_state->intx_evtfd, 1); 1034 1035 #if defined(DEBUG_INTR) 1036 pr_info("Intx triggered\n"); 1037 #endif 1038 if (ret != 1) 1039 pr_err("%s: eventfd signal failed (%d)\n", __func__, ret); 1040 1041 return ret; 1042 } 1043 1044 static int mtty_get_region_info(struct mdev_state *mdev_state, 1045 struct vfio_region_info *region_info, 1046 u16 *cap_type_id, void **cap_type) 1047 { 1048 unsigned int size = 0; 1049 u32 bar_index; 1050 1051 bar_index = region_info->index; 1052 if (bar_index >= VFIO_PCI_NUM_REGIONS) 1053 return -EINVAL; 1054 1055 mutex_lock(&mdev_state->ops_lock); 1056 1057 switch (bar_index) { 1058 case VFIO_PCI_CONFIG_REGION_INDEX: 1059 size = MTTY_CONFIG_SPACE_SIZE; 1060 break; 1061 case VFIO_PCI_BAR0_REGION_INDEX: 1062 size = MTTY_IO_BAR_SIZE; 1063 break; 1064 case VFIO_PCI_BAR1_REGION_INDEX: 1065 if (mdev_state->nr_ports == 2) 1066 size = MTTY_IO_BAR_SIZE; 1067 break; 1068 default: 1069 size = 0; 1070 break; 1071 } 1072 1073 mdev_state->region_info[bar_index].size = size; 1074 mdev_state->region_info[bar_index].vfio_offset = 1075 MTTY_VFIO_PCI_INDEX_TO_OFFSET(bar_index); 1076 1077 region_info->size = size; 1078 region_info->offset = MTTY_VFIO_PCI_INDEX_TO_OFFSET(bar_index); 1079 region_info->flags = VFIO_REGION_INFO_FLAG_READ | 1080 VFIO_REGION_INFO_FLAG_WRITE; 1081 mutex_unlock(&mdev_state->ops_lock); 1082 return 0; 1083 } 1084 1085 static int mtty_get_irq_info(struct vfio_irq_info *irq_info) 1086 { 1087 switch (irq_info->index) { 1088 case VFIO_PCI_INTX_IRQ_INDEX: 1089 case VFIO_PCI_MSI_IRQ_INDEX: 1090 case VFIO_PCI_REQ_IRQ_INDEX: 1091 break; 1092 1093 default: 1094 return -EINVAL; 1095 } 1096 1097 irq_info->flags = VFIO_IRQ_INFO_EVENTFD; 1098 irq_info->count = 1; 1099 1100 if (irq_info->index == VFIO_PCI_INTX_IRQ_INDEX) 1101 irq_info->flags |= (VFIO_IRQ_INFO_MASKABLE | 1102 VFIO_IRQ_INFO_AUTOMASKED); 1103 else 1104 irq_info->flags |= VFIO_IRQ_INFO_NORESIZE; 1105 1106 return 0; 1107 } 1108 1109 static int mtty_get_device_info(struct vfio_device_info *dev_info) 1110 { 1111 dev_info->flags = VFIO_DEVICE_FLAGS_PCI; 1112 dev_info->num_regions = VFIO_PCI_NUM_REGIONS; 1113 dev_info->num_irqs = VFIO_PCI_NUM_IRQS; 1114 1115 return 0; 1116 } 1117 1118 static long mtty_ioctl(struct vfio_device *vdev, unsigned int cmd, 1119 unsigned long arg) 1120 { 1121 struct mdev_state *mdev_state = 1122 container_of(vdev, struct mdev_state, vdev); 1123 int ret = 0; 1124 unsigned long minsz; 1125 1126 switch (cmd) { 1127 case VFIO_DEVICE_GET_INFO: 1128 { 1129 struct vfio_device_info info; 1130 1131 minsz = offsetofend(struct vfio_device_info, num_irqs); 1132 1133 if (copy_from_user(&info, (void __user *)arg, minsz)) 1134 return -EFAULT; 1135 1136 if (info.argsz < minsz) 1137 return -EINVAL; 1138 1139 ret = mtty_get_device_info(&info); 1140 if (ret) 1141 return ret; 1142 1143 memcpy(&mdev_state->dev_info, &info, sizeof(info)); 1144 1145 if (copy_to_user((void __user *)arg, &info, minsz)) 1146 return -EFAULT; 1147 1148 return 0; 1149 } 1150 case VFIO_DEVICE_GET_REGION_INFO: 1151 { 1152 struct vfio_region_info info; 1153 u16 cap_type_id = 0; 1154 void *cap_type = NULL; 1155 1156 minsz = offsetofend(struct vfio_region_info, offset); 1157 1158 if (copy_from_user(&info, (void __user *)arg, minsz)) 1159 return -EFAULT; 1160 1161 if (info.argsz < minsz) 1162 return -EINVAL; 1163 1164 ret = mtty_get_region_info(mdev_state, &info, &cap_type_id, 1165 &cap_type); 1166 if (ret) 1167 return ret; 1168 1169 if (copy_to_user((void __user *)arg, &info, minsz)) 1170 return -EFAULT; 1171 1172 return 0; 1173 } 1174 1175 case VFIO_DEVICE_GET_IRQ_INFO: 1176 { 1177 struct vfio_irq_info info; 1178 1179 minsz = offsetofend(struct vfio_irq_info, count); 1180 1181 if (copy_from_user(&info, (void __user *)arg, minsz)) 1182 return -EFAULT; 1183 1184 if ((info.argsz < minsz) || 1185 (info.index >= mdev_state->dev_info.num_irqs)) 1186 return -EINVAL; 1187 1188 ret = mtty_get_irq_info(&info); 1189 if (ret) 1190 return ret; 1191 1192 if (copy_to_user((void __user *)arg, &info, minsz)) 1193 return -EFAULT; 1194 1195 return 0; 1196 } 1197 case VFIO_DEVICE_SET_IRQS: 1198 { 1199 struct vfio_irq_set hdr; 1200 u8 *data = NULL, *ptr = NULL; 1201 size_t data_size = 0; 1202 1203 minsz = offsetofend(struct vfio_irq_set, count); 1204 1205 if (copy_from_user(&hdr, (void __user *)arg, minsz)) 1206 return -EFAULT; 1207 1208 ret = vfio_set_irqs_validate_and_prepare(&hdr, 1209 mdev_state->dev_info.num_irqs, 1210 VFIO_PCI_NUM_IRQS, 1211 &data_size); 1212 if (ret) 1213 return ret; 1214 1215 if (data_size) { 1216 ptr = data = memdup_user((void __user *)(arg + minsz), 1217 data_size); 1218 if (IS_ERR(data)) 1219 return PTR_ERR(data); 1220 } 1221 1222 ret = mtty_set_irqs(mdev_state, hdr.flags, hdr.index, hdr.start, 1223 hdr.count, data); 1224 1225 kfree(ptr); 1226 return ret; 1227 } 1228 case VFIO_DEVICE_RESET: 1229 return mtty_reset(mdev_state); 1230 } 1231 return -ENOTTY; 1232 } 1233 1234 static ssize_t 1235 sample_mdev_dev_show(struct device *dev, struct device_attribute *attr, 1236 char *buf) 1237 { 1238 return sprintf(buf, "This is MDEV %s\n", dev_name(dev)); 1239 } 1240 1241 static DEVICE_ATTR_RO(sample_mdev_dev); 1242 1243 static struct attribute *mdev_dev_attrs[] = { 1244 &dev_attr_sample_mdev_dev.attr, 1245 NULL, 1246 }; 1247 1248 static const struct attribute_group mdev_dev_group = { 1249 .name = "vendor", 1250 .attrs = mdev_dev_attrs, 1251 }; 1252 1253 static const struct attribute_group *mdev_dev_groups[] = { 1254 &mdev_dev_group, 1255 NULL, 1256 }; 1257 1258 static ssize_t name_show(struct mdev_type *mtype, 1259 struct mdev_type_attribute *attr, char *buf) 1260 { 1261 struct mtty_type *type = container_of(mtype, struct mtty_type, type); 1262 1263 return sysfs_emit(buf, "%s\n", type->name); 1264 } 1265 1266 static MDEV_TYPE_ATTR_RO(name); 1267 1268 static ssize_t available_instances_show(struct mdev_type *mtype, 1269 struct mdev_type_attribute *attr, 1270 char *buf) 1271 { 1272 struct mtty_type *type = container_of(mtype, struct mtty_type, type); 1273 1274 return sprintf(buf, "%d\n", atomic_read(&mdev_avail_ports) / 1275 type->nr_ports); 1276 } 1277 1278 static MDEV_TYPE_ATTR_RO(available_instances); 1279 1280 static ssize_t device_api_show(struct mdev_type *mtype, 1281 struct mdev_type_attribute *attr, char *buf) 1282 { 1283 return sprintf(buf, "%s\n", VFIO_DEVICE_API_PCI_STRING); 1284 } 1285 1286 static MDEV_TYPE_ATTR_RO(device_api); 1287 1288 static const struct attribute *mdev_types_attrs[] = { 1289 &mdev_type_attr_name.attr, 1290 &mdev_type_attr_device_api.attr, 1291 &mdev_type_attr_available_instances.attr, 1292 NULL, 1293 }; 1294 1295 static const struct vfio_device_ops mtty_dev_ops = { 1296 .name = "vfio-mtty", 1297 .init = mtty_init_dev, 1298 .release = mtty_release_dev, 1299 .read = mtty_read, 1300 .write = mtty_write, 1301 .ioctl = mtty_ioctl, 1302 }; 1303 1304 static struct mdev_driver mtty_driver = { 1305 .driver = { 1306 .name = "mtty", 1307 .owner = THIS_MODULE, 1308 .mod_name = KBUILD_MODNAME, 1309 .dev_groups = mdev_dev_groups, 1310 }, 1311 .probe = mtty_probe, 1312 .remove = mtty_remove, 1313 .types_attrs = mdev_types_attrs, 1314 }; 1315 1316 static void mtty_device_release(struct device *dev) 1317 { 1318 dev_dbg(dev, "mtty: released\n"); 1319 } 1320 1321 static int __init mtty_dev_init(void) 1322 { 1323 int ret = 0; 1324 1325 pr_info("mtty_dev: %s\n", __func__); 1326 1327 memset(&mtty_dev, 0, sizeof(mtty_dev)); 1328 1329 idr_init(&mtty_dev.vd_idr); 1330 1331 ret = alloc_chrdev_region(&mtty_dev.vd_devt, 0, MINORMASK + 1, 1332 MTTY_NAME); 1333 1334 if (ret < 0) { 1335 pr_err("Error: failed to register mtty_dev, err:%d\n", ret); 1336 return ret; 1337 } 1338 1339 cdev_init(&mtty_dev.vd_cdev, &vd_fops); 1340 cdev_add(&mtty_dev.vd_cdev, mtty_dev.vd_devt, MINORMASK + 1); 1341 1342 pr_info("major_number:%d\n", MAJOR(mtty_dev.vd_devt)); 1343 1344 ret = mdev_register_driver(&mtty_driver); 1345 if (ret) 1346 goto err_cdev; 1347 1348 mtty_dev.vd_class = class_create(THIS_MODULE, MTTY_CLASS_NAME); 1349 1350 if (IS_ERR(mtty_dev.vd_class)) { 1351 pr_err("Error: failed to register mtty_dev class\n"); 1352 ret = PTR_ERR(mtty_dev.vd_class); 1353 goto err_driver; 1354 } 1355 1356 mtty_dev.dev.class = mtty_dev.vd_class; 1357 mtty_dev.dev.release = mtty_device_release; 1358 dev_set_name(&mtty_dev.dev, "%s", MTTY_NAME); 1359 1360 ret = device_register(&mtty_dev.dev); 1361 if (ret) 1362 goto err_class; 1363 1364 ret = mdev_register_parent(&mtty_dev.parent, &mtty_dev.dev, 1365 &mtty_driver, mtty_mdev_types, 1366 ARRAY_SIZE(mtty_mdev_types)); 1367 if (ret) 1368 goto err_device; 1369 return 0; 1370 1371 err_device: 1372 device_unregister(&mtty_dev.dev); 1373 err_class: 1374 class_destroy(mtty_dev.vd_class); 1375 err_driver: 1376 mdev_unregister_driver(&mtty_driver); 1377 err_cdev: 1378 cdev_del(&mtty_dev.vd_cdev); 1379 unregister_chrdev_region(mtty_dev.vd_devt, MINORMASK + 1); 1380 return ret; 1381 } 1382 1383 static void __exit mtty_dev_exit(void) 1384 { 1385 mtty_dev.dev.bus = NULL; 1386 mdev_unregister_parent(&mtty_dev.parent); 1387 1388 device_unregister(&mtty_dev.dev); 1389 idr_destroy(&mtty_dev.vd_idr); 1390 mdev_unregister_driver(&mtty_driver); 1391 cdev_del(&mtty_dev.vd_cdev); 1392 unregister_chrdev_region(mtty_dev.vd_devt, MINORMASK + 1); 1393 class_destroy(mtty_dev.vd_class); 1394 mtty_dev.vd_class = NULL; 1395 pr_info("mtty_dev: Unloaded!\n"); 1396 } 1397 1398 module_init(mtty_dev_init) 1399 module_exit(mtty_dev_exit) 1400 1401 MODULE_LICENSE("GPL v2"); 1402 MODULE_INFO(supported, "Test driver that simulate serial port over PCI"); 1403 MODULE_VERSION(VERSION_STRING); 1404 MODULE_AUTHOR(DRIVER_AUTHOR); 1405