1 // SPDX-License-Identifier: GPL-2.0-only 2 /* 3 * Mediated virtual PCI serial host device driver 4 * 5 * Copyright (c) 2016, NVIDIA CORPORATION. All rights reserved. 6 * Author: Neo Jia <cjia@nvidia.com> 7 * Kirti Wankhede <kwankhede@nvidia.com> 8 * 9 * Sample driver that creates mdev device that simulates serial port over PCI 10 * card. 11 */ 12 13 #include <linux/init.h> 14 #include <linux/module.h> 15 #include <linux/device.h> 16 #include <linux/kernel.h> 17 #include <linux/fs.h> 18 #include <linux/poll.h> 19 #include <linux/slab.h> 20 #include <linux/cdev.h> 21 #include <linux/sched.h> 22 #include <linux/wait.h> 23 #include <linux/uuid.h> 24 #include <linux/vfio.h> 25 #include <linux/iommu.h> 26 #include <linux/sysfs.h> 27 #include <linux/ctype.h> 28 #include <linux/file.h> 29 #include <linux/mdev.h> 30 #include <linux/pci.h> 31 #include <linux/serial.h> 32 #include <uapi/linux/serial_reg.h> 33 #include <linux/eventfd.h> 34 /* 35 * #defines 36 */ 37 38 #define VERSION_STRING "0.1" 39 #define DRIVER_AUTHOR "NVIDIA Corporation" 40 41 #define MTTY_CLASS_NAME "mtty" 42 43 #define MTTY_NAME "mtty" 44 45 #define MTTY_STRING_LEN 16 46 47 #define MTTY_CONFIG_SPACE_SIZE 0xff 48 #define MTTY_IO_BAR_SIZE 0x8 49 #define MTTY_MMIO_BAR_SIZE 0x100000 50 51 #define STORE_LE16(addr, val) (*(u16 *)addr = val) 52 #define STORE_LE32(addr, val) (*(u32 *)addr = val) 53 54 #define MAX_FIFO_SIZE 16 55 56 #define CIRCULAR_BUF_INC_IDX(idx) (idx = (idx + 1) & (MAX_FIFO_SIZE - 1)) 57 58 #define MTTY_VFIO_PCI_OFFSET_SHIFT 40 59 60 #define MTTY_VFIO_PCI_OFFSET_TO_INDEX(off) (off >> MTTY_VFIO_PCI_OFFSET_SHIFT) 61 #define MTTY_VFIO_PCI_INDEX_TO_OFFSET(index) \ 62 ((u64)(index) << MTTY_VFIO_PCI_OFFSET_SHIFT) 63 #define MTTY_VFIO_PCI_OFFSET_MASK \ 64 (((u64)(1) << MTTY_VFIO_PCI_OFFSET_SHIFT) - 1) 65 #define MAX_MTTYS 24 66 67 /* 68 * Global Structures 69 */ 70 71 static struct mtty_dev { 72 dev_t vd_devt; 73 struct class *vd_class; 74 struct cdev vd_cdev; 75 struct idr vd_idr; 76 struct device dev; 77 } mtty_dev; 78 79 struct mdev_region_info { 80 u64 start; 81 u64 phys_start; 82 u32 size; 83 u64 vfio_offset; 84 }; 85 86 #if defined(DEBUG_REGS) 87 static const char *wr_reg[] = { 88 "TX", 89 "IER", 90 "FCR", 91 "LCR", 92 "MCR", 93 "LSR", 94 "MSR", 95 "SCR" 96 }; 97 98 static const char *rd_reg[] = { 99 "RX", 100 "IER", 101 "IIR", 102 "LCR", 103 "MCR", 104 "LSR", 105 "MSR", 106 "SCR" 107 }; 108 #endif 109 110 /* loop back buffer */ 111 struct rxtx { 112 u8 fifo[MAX_FIFO_SIZE]; 113 u8 head, tail; 114 u8 count; 115 }; 116 117 struct serial_port { 118 u8 uart_reg[8]; /* 8 registers */ 119 struct rxtx rxtx; /* loop back buffer */ 120 bool dlab; 121 bool overrun; 122 u16 divisor; 123 u8 fcr; /* FIFO control register */ 124 u8 max_fifo_size; 125 u8 intr_trigger_level; /* interrupt trigger level */ 126 }; 127 128 /* State of each mdev device */ 129 struct mdev_state { 130 struct vfio_device vdev; 131 int irq_fd; 132 struct eventfd_ctx *intx_evtfd; 133 struct eventfd_ctx *msi_evtfd; 134 int irq_index; 135 u8 *vconfig; 136 struct mutex ops_lock; 137 struct mdev_device *mdev; 138 struct mdev_region_info region_info[VFIO_PCI_NUM_REGIONS]; 139 u32 bar_mask[VFIO_PCI_NUM_REGIONS]; 140 struct list_head next; 141 struct serial_port s[2]; 142 struct mutex rxtx_lock; 143 struct vfio_device_info dev_info; 144 int nr_ports; 145 }; 146 147 static atomic_t mdev_avail_ports = ATOMIC_INIT(MAX_MTTYS); 148 149 static const struct file_operations vd_fops = { 150 .owner = THIS_MODULE, 151 }; 152 153 static const struct vfio_device_ops mtty_dev_ops; 154 155 /* function prototypes */ 156 157 static int mtty_trigger_interrupt(struct mdev_state *mdev_state); 158 159 /* Helper functions */ 160 161 static void dump_buffer(u8 *buf, uint32_t count) 162 { 163 #if defined(DEBUG) 164 int i; 165 166 pr_info("Buffer:\n"); 167 for (i = 0; i < count; i++) { 168 pr_info("%2x ", *(buf + i)); 169 if ((i + 1) % 16 == 0) 170 pr_info("\n"); 171 } 172 #endif 173 } 174 175 static void mtty_create_config_space(struct mdev_state *mdev_state) 176 { 177 /* PCI dev ID */ 178 STORE_LE32((u32 *) &mdev_state->vconfig[0x0], 0x32534348); 179 180 /* Control: I/O+, Mem-, BusMaster- */ 181 STORE_LE16((u16 *) &mdev_state->vconfig[0x4], 0x0001); 182 183 /* Status: capabilities list absent */ 184 STORE_LE16((u16 *) &mdev_state->vconfig[0x6], 0x0200); 185 186 /* Rev ID */ 187 mdev_state->vconfig[0x8] = 0x10; 188 189 /* programming interface class : 16550-compatible serial controller */ 190 mdev_state->vconfig[0x9] = 0x02; 191 192 /* Sub class : 00 */ 193 mdev_state->vconfig[0xa] = 0x00; 194 195 /* Base class : Simple Communication controllers */ 196 mdev_state->vconfig[0xb] = 0x07; 197 198 /* base address registers */ 199 /* BAR0: IO space */ 200 STORE_LE32((u32 *) &mdev_state->vconfig[0x10], 0x000001); 201 mdev_state->bar_mask[0] = ~(MTTY_IO_BAR_SIZE) + 1; 202 203 if (mdev_state->nr_ports == 2) { 204 /* BAR1: IO space */ 205 STORE_LE32((u32 *) &mdev_state->vconfig[0x14], 0x000001); 206 mdev_state->bar_mask[1] = ~(MTTY_IO_BAR_SIZE) + 1; 207 } 208 209 /* Subsystem ID */ 210 STORE_LE32((u32 *) &mdev_state->vconfig[0x2c], 0x32534348); 211 212 mdev_state->vconfig[0x34] = 0x00; /* Cap Ptr */ 213 mdev_state->vconfig[0x3d] = 0x01; /* interrupt pin (INTA#) */ 214 215 /* Vendor specific data */ 216 mdev_state->vconfig[0x40] = 0x23; 217 mdev_state->vconfig[0x43] = 0x80; 218 mdev_state->vconfig[0x44] = 0x23; 219 mdev_state->vconfig[0x48] = 0x23; 220 mdev_state->vconfig[0x4c] = 0x23; 221 222 mdev_state->vconfig[0x60] = 0x50; 223 mdev_state->vconfig[0x61] = 0x43; 224 mdev_state->vconfig[0x62] = 0x49; 225 mdev_state->vconfig[0x63] = 0x20; 226 mdev_state->vconfig[0x64] = 0x53; 227 mdev_state->vconfig[0x65] = 0x65; 228 mdev_state->vconfig[0x66] = 0x72; 229 mdev_state->vconfig[0x67] = 0x69; 230 mdev_state->vconfig[0x68] = 0x61; 231 mdev_state->vconfig[0x69] = 0x6c; 232 mdev_state->vconfig[0x6a] = 0x2f; 233 mdev_state->vconfig[0x6b] = 0x55; 234 mdev_state->vconfig[0x6c] = 0x41; 235 mdev_state->vconfig[0x6d] = 0x52; 236 mdev_state->vconfig[0x6e] = 0x54; 237 } 238 239 static void handle_pci_cfg_write(struct mdev_state *mdev_state, u16 offset, 240 u8 *buf, u32 count) 241 { 242 u32 cfg_addr, bar_mask, bar_index = 0; 243 244 switch (offset) { 245 case 0x04: /* device control */ 246 case 0x06: /* device status */ 247 /* do nothing */ 248 break; 249 case 0x3c: /* interrupt line */ 250 mdev_state->vconfig[0x3c] = buf[0]; 251 break; 252 case 0x3d: 253 /* 254 * Interrupt Pin is hardwired to INTA. 255 * This field is write protected by hardware 256 */ 257 break; 258 case 0x10: /* BAR0 */ 259 case 0x14: /* BAR1 */ 260 if (offset == 0x10) 261 bar_index = 0; 262 else if (offset == 0x14) 263 bar_index = 1; 264 265 if ((mdev_state->nr_ports == 1) && (bar_index == 1)) { 266 STORE_LE32(&mdev_state->vconfig[offset], 0); 267 break; 268 } 269 270 cfg_addr = *(u32 *)buf; 271 pr_info("BAR%d addr 0x%x\n", bar_index, cfg_addr); 272 273 if (cfg_addr == 0xffffffff) { 274 bar_mask = mdev_state->bar_mask[bar_index]; 275 cfg_addr = (cfg_addr & bar_mask); 276 } 277 278 cfg_addr |= (mdev_state->vconfig[offset] & 0x3ul); 279 STORE_LE32(&mdev_state->vconfig[offset], cfg_addr); 280 break; 281 case 0x18: /* BAR2 */ 282 case 0x1c: /* BAR3 */ 283 case 0x20: /* BAR4 */ 284 STORE_LE32(&mdev_state->vconfig[offset], 0); 285 break; 286 default: 287 pr_info("PCI config write @0x%x of %d bytes not handled\n", 288 offset, count); 289 break; 290 } 291 } 292 293 static void handle_bar_write(unsigned int index, struct mdev_state *mdev_state, 294 u16 offset, u8 *buf, u32 count) 295 { 296 u8 data = *buf; 297 298 /* Handle data written by guest */ 299 switch (offset) { 300 case UART_TX: 301 /* if DLAB set, data is LSB of divisor */ 302 if (mdev_state->s[index].dlab) { 303 mdev_state->s[index].divisor |= data; 304 break; 305 } 306 307 mutex_lock(&mdev_state->rxtx_lock); 308 309 /* save in TX buffer */ 310 if (mdev_state->s[index].rxtx.count < 311 mdev_state->s[index].max_fifo_size) { 312 mdev_state->s[index].rxtx.fifo[ 313 mdev_state->s[index].rxtx.head] = data; 314 mdev_state->s[index].rxtx.count++; 315 CIRCULAR_BUF_INC_IDX(mdev_state->s[index].rxtx.head); 316 mdev_state->s[index].overrun = false; 317 318 /* 319 * Trigger interrupt if receive data interrupt is 320 * enabled and fifo reached trigger level 321 */ 322 if ((mdev_state->s[index].uart_reg[UART_IER] & 323 UART_IER_RDI) && 324 (mdev_state->s[index].rxtx.count == 325 mdev_state->s[index].intr_trigger_level)) { 326 /* trigger interrupt */ 327 #if defined(DEBUG_INTR) 328 pr_err("Serial port %d: Fifo level trigger\n", 329 index); 330 #endif 331 mtty_trigger_interrupt(mdev_state); 332 } 333 } else { 334 #if defined(DEBUG_INTR) 335 pr_err("Serial port %d: Buffer Overflow\n", index); 336 #endif 337 mdev_state->s[index].overrun = true; 338 339 /* 340 * Trigger interrupt if receiver line status interrupt 341 * is enabled 342 */ 343 if (mdev_state->s[index].uart_reg[UART_IER] & 344 UART_IER_RLSI) 345 mtty_trigger_interrupt(mdev_state); 346 } 347 mutex_unlock(&mdev_state->rxtx_lock); 348 break; 349 350 case UART_IER: 351 /* if DLAB set, data is MSB of divisor */ 352 if (mdev_state->s[index].dlab) 353 mdev_state->s[index].divisor |= (u16)data << 8; 354 else { 355 mdev_state->s[index].uart_reg[offset] = data; 356 mutex_lock(&mdev_state->rxtx_lock); 357 if ((data & UART_IER_THRI) && 358 (mdev_state->s[index].rxtx.head == 359 mdev_state->s[index].rxtx.tail)) { 360 #if defined(DEBUG_INTR) 361 pr_err("Serial port %d: IER_THRI write\n", 362 index); 363 #endif 364 mtty_trigger_interrupt(mdev_state); 365 } 366 367 mutex_unlock(&mdev_state->rxtx_lock); 368 } 369 370 break; 371 372 case UART_FCR: 373 mdev_state->s[index].fcr = data; 374 375 mutex_lock(&mdev_state->rxtx_lock); 376 if (data & (UART_FCR_CLEAR_RCVR | UART_FCR_CLEAR_XMIT)) { 377 /* clear loop back FIFO */ 378 mdev_state->s[index].rxtx.count = 0; 379 mdev_state->s[index].rxtx.head = 0; 380 mdev_state->s[index].rxtx.tail = 0; 381 } 382 mutex_unlock(&mdev_state->rxtx_lock); 383 384 switch (data & UART_FCR_TRIGGER_MASK) { 385 case UART_FCR_TRIGGER_1: 386 mdev_state->s[index].intr_trigger_level = 1; 387 break; 388 389 case UART_FCR_TRIGGER_4: 390 mdev_state->s[index].intr_trigger_level = 4; 391 break; 392 393 case UART_FCR_TRIGGER_8: 394 mdev_state->s[index].intr_trigger_level = 8; 395 break; 396 397 case UART_FCR_TRIGGER_14: 398 mdev_state->s[index].intr_trigger_level = 14; 399 break; 400 } 401 402 /* 403 * Set trigger level to 1 otherwise or implement timer with 404 * timeout of 4 characters and on expiring that timer set 405 * Recevice data timeout in IIR register 406 */ 407 mdev_state->s[index].intr_trigger_level = 1; 408 if (data & UART_FCR_ENABLE_FIFO) 409 mdev_state->s[index].max_fifo_size = MAX_FIFO_SIZE; 410 else { 411 mdev_state->s[index].max_fifo_size = 1; 412 mdev_state->s[index].intr_trigger_level = 1; 413 } 414 415 break; 416 417 case UART_LCR: 418 if (data & UART_LCR_DLAB) { 419 mdev_state->s[index].dlab = true; 420 mdev_state->s[index].divisor = 0; 421 } else 422 mdev_state->s[index].dlab = false; 423 424 mdev_state->s[index].uart_reg[offset] = data; 425 break; 426 427 case UART_MCR: 428 mdev_state->s[index].uart_reg[offset] = data; 429 430 if ((mdev_state->s[index].uart_reg[UART_IER] & UART_IER_MSI) && 431 (data & UART_MCR_OUT2)) { 432 #if defined(DEBUG_INTR) 433 pr_err("Serial port %d: MCR_OUT2 write\n", index); 434 #endif 435 mtty_trigger_interrupt(mdev_state); 436 } 437 438 if ((mdev_state->s[index].uart_reg[UART_IER] & UART_IER_MSI) && 439 (data & (UART_MCR_RTS | UART_MCR_DTR))) { 440 #if defined(DEBUG_INTR) 441 pr_err("Serial port %d: MCR RTS/DTR write\n", index); 442 #endif 443 mtty_trigger_interrupt(mdev_state); 444 } 445 break; 446 447 case UART_LSR: 448 case UART_MSR: 449 /* do nothing */ 450 break; 451 452 case UART_SCR: 453 mdev_state->s[index].uart_reg[offset] = data; 454 break; 455 456 default: 457 break; 458 } 459 } 460 461 static void handle_bar_read(unsigned int index, struct mdev_state *mdev_state, 462 u16 offset, u8 *buf, u32 count) 463 { 464 /* Handle read requests by guest */ 465 switch (offset) { 466 case UART_RX: 467 /* if DLAB set, data is LSB of divisor */ 468 if (mdev_state->s[index].dlab) { 469 *buf = (u8)mdev_state->s[index].divisor; 470 break; 471 } 472 473 mutex_lock(&mdev_state->rxtx_lock); 474 /* return data in tx buffer */ 475 if (mdev_state->s[index].rxtx.head != 476 mdev_state->s[index].rxtx.tail) { 477 *buf = mdev_state->s[index].rxtx.fifo[ 478 mdev_state->s[index].rxtx.tail]; 479 mdev_state->s[index].rxtx.count--; 480 CIRCULAR_BUF_INC_IDX(mdev_state->s[index].rxtx.tail); 481 } 482 483 if (mdev_state->s[index].rxtx.head == 484 mdev_state->s[index].rxtx.tail) { 485 /* 486 * Trigger interrupt if tx buffer empty interrupt is 487 * enabled and fifo is empty 488 */ 489 #if defined(DEBUG_INTR) 490 pr_err("Serial port %d: Buffer Empty\n", index); 491 #endif 492 if (mdev_state->s[index].uart_reg[UART_IER] & 493 UART_IER_THRI) 494 mtty_trigger_interrupt(mdev_state); 495 } 496 mutex_unlock(&mdev_state->rxtx_lock); 497 498 break; 499 500 case UART_IER: 501 if (mdev_state->s[index].dlab) { 502 *buf = (u8)(mdev_state->s[index].divisor >> 8); 503 break; 504 } 505 *buf = mdev_state->s[index].uart_reg[offset] & 0x0f; 506 break; 507 508 case UART_IIR: 509 { 510 u8 ier = mdev_state->s[index].uart_reg[UART_IER]; 511 *buf = 0; 512 513 mutex_lock(&mdev_state->rxtx_lock); 514 /* Interrupt priority 1: Parity, overrun, framing or break */ 515 if ((ier & UART_IER_RLSI) && mdev_state->s[index].overrun) 516 *buf |= UART_IIR_RLSI; 517 518 /* Interrupt priority 2: Fifo trigger level reached */ 519 if ((ier & UART_IER_RDI) && 520 (mdev_state->s[index].rxtx.count >= 521 mdev_state->s[index].intr_trigger_level)) 522 *buf |= UART_IIR_RDI; 523 524 /* Interrupt priotiry 3: transmitter holding register empty */ 525 if ((ier & UART_IER_THRI) && 526 (mdev_state->s[index].rxtx.head == 527 mdev_state->s[index].rxtx.tail)) 528 *buf |= UART_IIR_THRI; 529 530 /* Interrupt priotiry 4: Modem status: CTS, DSR, RI or DCD */ 531 if ((ier & UART_IER_MSI) && 532 (mdev_state->s[index].uart_reg[UART_MCR] & 533 (UART_MCR_RTS | UART_MCR_DTR))) 534 *buf |= UART_IIR_MSI; 535 536 /* bit0: 0=> interrupt pending, 1=> no interrupt is pending */ 537 if (*buf == 0) 538 *buf = UART_IIR_NO_INT; 539 540 /* set bit 6 & 7 to be 16550 compatible */ 541 *buf |= 0xC0; 542 mutex_unlock(&mdev_state->rxtx_lock); 543 } 544 break; 545 546 case UART_LCR: 547 case UART_MCR: 548 *buf = mdev_state->s[index].uart_reg[offset]; 549 break; 550 551 case UART_LSR: 552 { 553 u8 lsr = 0; 554 555 mutex_lock(&mdev_state->rxtx_lock); 556 /* atleast one char in FIFO */ 557 if (mdev_state->s[index].rxtx.head != 558 mdev_state->s[index].rxtx.tail) 559 lsr |= UART_LSR_DR; 560 561 /* if FIFO overrun */ 562 if (mdev_state->s[index].overrun) 563 lsr |= UART_LSR_OE; 564 565 /* transmit FIFO empty and tramsitter empty */ 566 if (mdev_state->s[index].rxtx.head == 567 mdev_state->s[index].rxtx.tail) 568 lsr |= UART_LSR_TEMT | UART_LSR_THRE; 569 570 mutex_unlock(&mdev_state->rxtx_lock); 571 *buf = lsr; 572 break; 573 } 574 case UART_MSR: 575 *buf = UART_MSR_DSR | UART_MSR_DDSR | UART_MSR_DCD; 576 577 mutex_lock(&mdev_state->rxtx_lock); 578 /* if AFE is 1 and FIFO have space, set CTS bit */ 579 if (mdev_state->s[index].uart_reg[UART_MCR] & 580 UART_MCR_AFE) { 581 if (mdev_state->s[index].rxtx.count < 582 mdev_state->s[index].max_fifo_size) 583 *buf |= UART_MSR_CTS | UART_MSR_DCTS; 584 } else 585 *buf |= UART_MSR_CTS | UART_MSR_DCTS; 586 mutex_unlock(&mdev_state->rxtx_lock); 587 588 break; 589 590 case UART_SCR: 591 *buf = mdev_state->s[index].uart_reg[offset]; 592 break; 593 594 default: 595 break; 596 } 597 } 598 599 static void mdev_read_base(struct mdev_state *mdev_state) 600 { 601 int index, pos; 602 u32 start_lo, start_hi; 603 u32 mem_type; 604 605 pos = PCI_BASE_ADDRESS_0; 606 607 for (index = 0; index <= VFIO_PCI_BAR5_REGION_INDEX; index++) { 608 609 if (!mdev_state->region_info[index].size) 610 continue; 611 612 start_lo = (*(u32 *)(mdev_state->vconfig + pos)) & 613 PCI_BASE_ADDRESS_MEM_MASK; 614 mem_type = (*(u32 *)(mdev_state->vconfig + pos)) & 615 PCI_BASE_ADDRESS_MEM_TYPE_MASK; 616 617 switch (mem_type) { 618 case PCI_BASE_ADDRESS_MEM_TYPE_64: 619 start_hi = (*(u32 *)(mdev_state->vconfig + pos + 4)); 620 pos += 4; 621 break; 622 case PCI_BASE_ADDRESS_MEM_TYPE_32: 623 case PCI_BASE_ADDRESS_MEM_TYPE_1M: 624 /* 1M mem BAR treated as 32-bit BAR */ 625 default: 626 /* mem unknown type treated as 32-bit BAR */ 627 start_hi = 0; 628 break; 629 } 630 pos += 4; 631 mdev_state->region_info[index].start = ((u64)start_hi << 32) | 632 start_lo; 633 } 634 } 635 636 static ssize_t mdev_access(struct mdev_state *mdev_state, u8 *buf, size_t count, 637 loff_t pos, bool is_write) 638 { 639 unsigned int index; 640 loff_t offset; 641 int ret = 0; 642 643 if (!buf) 644 return -EINVAL; 645 646 mutex_lock(&mdev_state->ops_lock); 647 648 index = MTTY_VFIO_PCI_OFFSET_TO_INDEX(pos); 649 offset = pos & MTTY_VFIO_PCI_OFFSET_MASK; 650 switch (index) { 651 case VFIO_PCI_CONFIG_REGION_INDEX: 652 653 #if defined(DEBUG) 654 pr_info("%s: PCI config space %s at offset 0x%llx\n", 655 __func__, is_write ? "write" : "read", offset); 656 #endif 657 if (is_write) { 658 dump_buffer(buf, count); 659 handle_pci_cfg_write(mdev_state, offset, buf, count); 660 } else { 661 memcpy(buf, (mdev_state->vconfig + offset), count); 662 dump_buffer(buf, count); 663 } 664 665 break; 666 667 case VFIO_PCI_BAR0_REGION_INDEX ... VFIO_PCI_BAR5_REGION_INDEX: 668 if (!mdev_state->region_info[index].start) 669 mdev_read_base(mdev_state); 670 671 if (is_write) { 672 dump_buffer(buf, count); 673 674 #if defined(DEBUG_REGS) 675 pr_info("%s: BAR%d WR @0x%llx %s val:0x%02x dlab:%d\n", 676 __func__, index, offset, wr_reg[offset], 677 *buf, mdev_state->s[index].dlab); 678 #endif 679 handle_bar_write(index, mdev_state, offset, buf, count); 680 } else { 681 handle_bar_read(index, mdev_state, offset, buf, count); 682 dump_buffer(buf, count); 683 684 #if defined(DEBUG_REGS) 685 pr_info("%s: BAR%d RD @0x%llx %s val:0x%02x dlab:%d\n", 686 __func__, index, offset, rd_reg[offset], 687 *buf, mdev_state->s[index].dlab); 688 #endif 689 } 690 break; 691 692 default: 693 ret = -1; 694 goto accessfailed; 695 } 696 697 ret = count; 698 699 700 accessfailed: 701 mutex_unlock(&mdev_state->ops_lock); 702 703 return ret; 704 } 705 706 static int mtty_init_dev(struct vfio_device *vdev) 707 { 708 struct mdev_state *mdev_state = 709 container_of(vdev, struct mdev_state, vdev); 710 struct mdev_device *mdev = to_mdev_device(vdev->dev); 711 int nr_ports = mdev_get_type_group_id(mdev) + 1; 712 int avail_ports = atomic_read(&mdev_avail_ports); 713 int ret; 714 715 do { 716 if (avail_ports < nr_ports) 717 return -ENOSPC; 718 } while (!atomic_try_cmpxchg(&mdev_avail_ports, 719 &avail_ports, avail_ports - nr_ports)); 720 721 mdev_state->nr_ports = nr_ports; 722 mdev_state->irq_index = -1; 723 mdev_state->s[0].max_fifo_size = MAX_FIFO_SIZE; 724 mdev_state->s[1].max_fifo_size = MAX_FIFO_SIZE; 725 mutex_init(&mdev_state->rxtx_lock); 726 727 mdev_state->vconfig = kzalloc(MTTY_CONFIG_SPACE_SIZE, GFP_KERNEL); 728 if (!mdev_state->vconfig) { 729 ret = -ENOMEM; 730 goto err_nr_ports; 731 } 732 733 mutex_init(&mdev_state->ops_lock); 734 mdev_state->mdev = mdev; 735 mtty_create_config_space(mdev_state); 736 return 0; 737 738 err_nr_ports: 739 atomic_add(nr_ports, &mdev_avail_ports); 740 return ret; 741 } 742 743 static int mtty_probe(struct mdev_device *mdev) 744 { 745 struct mdev_state *mdev_state; 746 int ret; 747 748 mdev_state = vfio_alloc_device(mdev_state, vdev, &mdev->dev, 749 &mtty_dev_ops); 750 if (IS_ERR(mdev_state)) 751 return PTR_ERR(mdev_state); 752 753 ret = vfio_register_emulated_iommu_dev(&mdev_state->vdev); 754 if (ret) 755 goto err_put_vdev; 756 dev_set_drvdata(&mdev->dev, mdev_state); 757 return 0; 758 759 err_put_vdev: 760 vfio_put_device(&mdev_state->vdev); 761 return ret; 762 } 763 764 static void mtty_release_dev(struct vfio_device *vdev) 765 { 766 struct mdev_state *mdev_state = 767 container_of(vdev, struct mdev_state, vdev); 768 769 atomic_add(mdev_state->nr_ports, &mdev_avail_ports); 770 kfree(mdev_state->vconfig); 771 vfio_free_device(vdev); 772 } 773 774 static void mtty_remove(struct mdev_device *mdev) 775 { 776 struct mdev_state *mdev_state = dev_get_drvdata(&mdev->dev); 777 778 vfio_unregister_group_dev(&mdev_state->vdev); 779 vfio_put_device(&mdev_state->vdev); 780 } 781 782 static int mtty_reset(struct mdev_state *mdev_state) 783 { 784 pr_info("%s: called\n", __func__); 785 786 return 0; 787 } 788 789 static ssize_t mtty_read(struct vfio_device *vdev, char __user *buf, 790 size_t count, loff_t *ppos) 791 { 792 struct mdev_state *mdev_state = 793 container_of(vdev, struct mdev_state, vdev); 794 unsigned int done = 0; 795 int ret; 796 797 while (count) { 798 size_t filled; 799 800 if (count >= 4 && !(*ppos % 4)) { 801 u32 val; 802 803 ret = mdev_access(mdev_state, (u8 *)&val, sizeof(val), 804 *ppos, false); 805 if (ret <= 0) 806 goto read_err; 807 808 if (copy_to_user(buf, &val, sizeof(val))) 809 goto read_err; 810 811 filled = 4; 812 } else if (count >= 2 && !(*ppos % 2)) { 813 u16 val; 814 815 ret = mdev_access(mdev_state, (u8 *)&val, sizeof(val), 816 *ppos, false); 817 if (ret <= 0) 818 goto read_err; 819 820 if (copy_to_user(buf, &val, sizeof(val))) 821 goto read_err; 822 823 filled = 2; 824 } else { 825 u8 val; 826 827 ret = mdev_access(mdev_state, (u8 *)&val, sizeof(val), 828 *ppos, false); 829 if (ret <= 0) 830 goto read_err; 831 832 if (copy_to_user(buf, &val, sizeof(val))) 833 goto read_err; 834 835 filled = 1; 836 } 837 838 count -= filled; 839 done += filled; 840 *ppos += filled; 841 buf += filled; 842 } 843 844 return done; 845 846 read_err: 847 return -EFAULT; 848 } 849 850 static ssize_t mtty_write(struct vfio_device *vdev, const char __user *buf, 851 size_t count, loff_t *ppos) 852 { 853 struct mdev_state *mdev_state = 854 container_of(vdev, struct mdev_state, vdev); 855 unsigned int done = 0; 856 int ret; 857 858 while (count) { 859 size_t filled; 860 861 if (count >= 4 && !(*ppos % 4)) { 862 u32 val; 863 864 if (copy_from_user(&val, buf, sizeof(val))) 865 goto write_err; 866 867 ret = mdev_access(mdev_state, (u8 *)&val, sizeof(val), 868 *ppos, true); 869 if (ret <= 0) 870 goto write_err; 871 872 filled = 4; 873 } else if (count >= 2 && !(*ppos % 2)) { 874 u16 val; 875 876 if (copy_from_user(&val, buf, sizeof(val))) 877 goto write_err; 878 879 ret = mdev_access(mdev_state, (u8 *)&val, sizeof(val), 880 *ppos, true); 881 if (ret <= 0) 882 goto write_err; 883 884 filled = 2; 885 } else { 886 u8 val; 887 888 if (copy_from_user(&val, buf, sizeof(val))) 889 goto write_err; 890 891 ret = mdev_access(mdev_state, (u8 *)&val, sizeof(val), 892 *ppos, true); 893 if (ret <= 0) 894 goto write_err; 895 896 filled = 1; 897 } 898 count -= filled; 899 done += filled; 900 *ppos += filled; 901 buf += filled; 902 } 903 904 return done; 905 write_err: 906 return -EFAULT; 907 } 908 909 static int mtty_set_irqs(struct mdev_state *mdev_state, uint32_t flags, 910 unsigned int index, unsigned int start, 911 unsigned int count, void *data) 912 { 913 int ret = 0; 914 915 mutex_lock(&mdev_state->ops_lock); 916 switch (index) { 917 case VFIO_PCI_INTX_IRQ_INDEX: 918 switch (flags & VFIO_IRQ_SET_ACTION_TYPE_MASK) { 919 case VFIO_IRQ_SET_ACTION_MASK: 920 case VFIO_IRQ_SET_ACTION_UNMASK: 921 break; 922 case VFIO_IRQ_SET_ACTION_TRIGGER: 923 { 924 if (flags & VFIO_IRQ_SET_DATA_NONE) { 925 pr_info("%s: disable INTx\n", __func__); 926 if (mdev_state->intx_evtfd) 927 eventfd_ctx_put(mdev_state->intx_evtfd); 928 break; 929 } 930 931 if (flags & VFIO_IRQ_SET_DATA_EVENTFD) { 932 int fd = *(int *)data; 933 934 if (fd > 0) { 935 struct eventfd_ctx *evt; 936 937 evt = eventfd_ctx_fdget(fd); 938 if (IS_ERR(evt)) { 939 ret = PTR_ERR(evt); 940 break; 941 } 942 mdev_state->intx_evtfd = evt; 943 mdev_state->irq_fd = fd; 944 mdev_state->irq_index = index; 945 break; 946 } 947 } 948 break; 949 } 950 } 951 break; 952 case VFIO_PCI_MSI_IRQ_INDEX: 953 switch (flags & VFIO_IRQ_SET_ACTION_TYPE_MASK) { 954 case VFIO_IRQ_SET_ACTION_MASK: 955 case VFIO_IRQ_SET_ACTION_UNMASK: 956 break; 957 case VFIO_IRQ_SET_ACTION_TRIGGER: 958 if (flags & VFIO_IRQ_SET_DATA_NONE) { 959 if (mdev_state->msi_evtfd) 960 eventfd_ctx_put(mdev_state->msi_evtfd); 961 pr_info("%s: disable MSI\n", __func__); 962 mdev_state->irq_index = VFIO_PCI_INTX_IRQ_INDEX; 963 break; 964 } 965 if (flags & VFIO_IRQ_SET_DATA_EVENTFD) { 966 int fd = *(int *)data; 967 struct eventfd_ctx *evt; 968 969 if (fd <= 0) 970 break; 971 972 if (mdev_state->msi_evtfd) 973 break; 974 975 evt = eventfd_ctx_fdget(fd); 976 if (IS_ERR(evt)) { 977 ret = PTR_ERR(evt); 978 break; 979 } 980 mdev_state->msi_evtfd = evt; 981 mdev_state->irq_fd = fd; 982 mdev_state->irq_index = index; 983 } 984 break; 985 } 986 break; 987 case VFIO_PCI_MSIX_IRQ_INDEX: 988 pr_info("%s: MSIX_IRQ\n", __func__); 989 break; 990 case VFIO_PCI_ERR_IRQ_INDEX: 991 pr_info("%s: ERR_IRQ\n", __func__); 992 break; 993 case VFIO_PCI_REQ_IRQ_INDEX: 994 pr_info("%s: REQ_IRQ\n", __func__); 995 break; 996 } 997 998 mutex_unlock(&mdev_state->ops_lock); 999 return ret; 1000 } 1001 1002 static int mtty_trigger_interrupt(struct mdev_state *mdev_state) 1003 { 1004 int ret = -1; 1005 1006 if ((mdev_state->irq_index == VFIO_PCI_MSI_IRQ_INDEX) && 1007 (!mdev_state->msi_evtfd)) 1008 return -EINVAL; 1009 else if ((mdev_state->irq_index == VFIO_PCI_INTX_IRQ_INDEX) && 1010 (!mdev_state->intx_evtfd)) { 1011 pr_info("%s: Intr eventfd not found\n", __func__); 1012 return -EINVAL; 1013 } 1014 1015 if (mdev_state->irq_index == VFIO_PCI_MSI_IRQ_INDEX) 1016 ret = eventfd_signal(mdev_state->msi_evtfd, 1); 1017 else 1018 ret = eventfd_signal(mdev_state->intx_evtfd, 1); 1019 1020 #if defined(DEBUG_INTR) 1021 pr_info("Intx triggered\n"); 1022 #endif 1023 if (ret != 1) 1024 pr_err("%s: eventfd signal failed (%d)\n", __func__, ret); 1025 1026 return ret; 1027 } 1028 1029 static int mtty_get_region_info(struct mdev_state *mdev_state, 1030 struct vfio_region_info *region_info, 1031 u16 *cap_type_id, void **cap_type) 1032 { 1033 unsigned int size = 0; 1034 u32 bar_index; 1035 1036 bar_index = region_info->index; 1037 if (bar_index >= VFIO_PCI_NUM_REGIONS) 1038 return -EINVAL; 1039 1040 mutex_lock(&mdev_state->ops_lock); 1041 1042 switch (bar_index) { 1043 case VFIO_PCI_CONFIG_REGION_INDEX: 1044 size = MTTY_CONFIG_SPACE_SIZE; 1045 break; 1046 case VFIO_PCI_BAR0_REGION_INDEX: 1047 size = MTTY_IO_BAR_SIZE; 1048 break; 1049 case VFIO_PCI_BAR1_REGION_INDEX: 1050 if (mdev_state->nr_ports == 2) 1051 size = MTTY_IO_BAR_SIZE; 1052 break; 1053 default: 1054 size = 0; 1055 break; 1056 } 1057 1058 mdev_state->region_info[bar_index].size = size; 1059 mdev_state->region_info[bar_index].vfio_offset = 1060 MTTY_VFIO_PCI_INDEX_TO_OFFSET(bar_index); 1061 1062 region_info->size = size; 1063 region_info->offset = MTTY_VFIO_PCI_INDEX_TO_OFFSET(bar_index); 1064 region_info->flags = VFIO_REGION_INFO_FLAG_READ | 1065 VFIO_REGION_INFO_FLAG_WRITE; 1066 mutex_unlock(&mdev_state->ops_lock); 1067 return 0; 1068 } 1069 1070 static int mtty_get_irq_info(struct vfio_irq_info *irq_info) 1071 { 1072 switch (irq_info->index) { 1073 case VFIO_PCI_INTX_IRQ_INDEX: 1074 case VFIO_PCI_MSI_IRQ_INDEX: 1075 case VFIO_PCI_REQ_IRQ_INDEX: 1076 break; 1077 1078 default: 1079 return -EINVAL; 1080 } 1081 1082 irq_info->flags = VFIO_IRQ_INFO_EVENTFD; 1083 irq_info->count = 1; 1084 1085 if (irq_info->index == VFIO_PCI_INTX_IRQ_INDEX) 1086 irq_info->flags |= (VFIO_IRQ_INFO_MASKABLE | 1087 VFIO_IRQ_INFO_AUTOMASKED); 1088 else 1089 irq_info->flags |= VFIO_IRQ_INFO_NORESIZE; 1090 1091 return 0; 1092 } 1093 1094 static int mtty_get_device_info(struct vfio_device_info *dev_info) 1095 { 1096 dev_info->flags = VFIO_DEVICE_FLAGS_PCI; 1097 dev_info->num_regions = VFIO_PCI_NUM_REGIONS; 1098 dev_info->num_irqs = VFIO_PCI_NUM_IRQS; 1099 1100 return 0; 1101 } 1102 1103 static long mtty_ioctl(struct vfio_device *vdev, unsigned int cmd, 1104 unsigned long arg) 1105 { 1106 struct mdev_state *mdev_state = 1107 container_of(vdev, struct mdev_state, vdev); 1108 int ret = 0; 1109 unsigned long minsz; 1110 1111 switch (cmd) { 1112 case VFIO_DEVICE_GET_INFO: 1113 { 1114 struct vfio_device_info info; 1115 1116 minsz = offsetofend(struct vfio_device_info, num_irqs); 1117 1118 if (copy_from_user(&info, (void __user *)arg, minsz)) 1119 return -EFAULT; 1120 1121 if (info.argsz < minsz) 1122 return -EINVAL; 1123 1124 ret = mtty_get_device_info(&info); 1125 if (ret) 1126 return ret; 1127 1128 memcpy(&mdev_state->dev_info, &info, sizeof(info)); 1129 1130 if (copy_to_user((void __user *)arg, &info, minsz)) 1131 return -EFAULT; 1132 1133 return 0; 1134 } 1135 case VFIO_DEVICE_GET_REGION_INFO: 1136 { 1137 struct vfio_region_info info; 1138 u16 cap_type_id = 0; 1139 void *cap_type = NULL; 1140 1141 minsz = offsetofend(struct vfio_region_info, offset); 1142 1143 if (copy_from_user(&info, (void __user *)arg, minsz)) 1144 return -EFAULT; 1145 1146 if (info.argsz < minsz) 1147 return -EINVAL; 1148 1149 ret = mtty_get_region_info(mdev_state, &info, &cap_type_id, 1150 &cap_type); 1151 if (ret) 1152 return ret; 1153 1154 if (copy_to_user((void __user *)arg, &info, minsz)) 1155 return -EFAULT; 1156 1157 return 0; 1158 } 1159 1160 case VFIO_DEVICE_GET_IRQ_INFO: 1161 { 1162 struct vfio_irq_info info; 1163 1164 minsz = offsetofend(struct vfio_irq_info, count); 1165 1166 if (copy_from_user(&info, (void __user *)arg, minsz)) 1167 return -EFAULT; 1168 1169 if ((info.argsz < minsz) || 1170 (info.index >= mdev_state->dev_info.num_irqs)) 1171 return -EINVAL; 1172 1173 ret = mtty_get_irq_info(&info); 1174 if (ret) 1175 return ret; 1176 1177 if (copy_to_user((void __user *)arg, &info, minsz)) 1178 return -EFAULT; 1179 1180 return 0; 1181 } 1182 case VFIO_DEVICE_SET_IRQS: 1183 { 1184 struct vfio_irq_set hdr; 1185 u8 *data = NULL, *ptr = NULL; 1186 size_t data_size = 0; 1187 1188 minsz = offsetofend(struct vfio_irq_set, count); 1189 1190 if (copy_from_user(&hdr, (void __user *)arg, minsz)) 1191 return -EFAULT; 1192 1193 ret = vfio_set_irqs_validate_and_prepare(&hdr, 1194 mdev_state->dev_info.num_irqs, 1195 VFIO_PCI_NUM_IRQS, 1196 &data_size); 1197 if (ret) 1198 return ret; 1199 1200 if (data_size) { 1201 ptr = data = memdup_user((void __user *)(arg + minsz), 1202 data_size); 1203 if (IS_ERR(data)) 1204 return PTR_ERR(data); 1205 } 1206 1207 ret = mtty_set_irqs(mdev_state, hdr.flags, hdr.index, hdr.start, 1208 hdr.count, data); 1209 1210 kfree(ptr); 1211 return ret; 1212 } 1213 case VFIO_DEVICE_RESET: 1214 return mtty_reset(mdev_state); 1215 } 1216 return -ENOTTY; 1217 } 1218 1219 static ssize_t 1220 sample_mdev_dev_show(struct device *dev, struct device_attribute *attr, 1221 char *buf) 1222 { 1223 return sprintf(buf, "This is MDEV %s\n", dev_name(dev)); 1224 } 1225 1226 static DEVICE_ATTR_RO(sample_mdev_dev); 1227 1228 static struct attribute *mdev_dev_attrs[] = { 1229 &dev_attr_sample_mdev_dev.attr, 1230 NULL, 1231 }; 1232 1233 static const struct attribute_group mdev_dev_group = { 1234 .name = "vendor", 1235 .attrs = mdev_dev_attrs, 1236 }; 1237 1238 static const struct attribute_group *mdev_dev_groups[] = { 1239 &mdev_dev_group, 1240 NULL, 1241 }; 1242 1243 static ssize_t name_show(struct mdev_type *mtype, 1244 struct mdev_type_attribute *attr, char *buf) 1245 { 1246 static const char *name_str[2] = { "Single port serial", 1247 "Dual port serial" }; 1248 1249 return sysfs_emit(buf, "%s\n", 1250 name_str[mtype_get_type_group_id(mtype)]); 1251 } 1252 1253 static MDEV_TYPE_ATTR_RO(name); 1254 1255 static ssize_t available_instances_show(struct mdev_type *mtype, 1256 struct mdev_type_attribute *attr, 1257 char *buf) 1258 { 1259 unsigned int ports = mtype_get_type_group_id(mtype) + 1; 1260 1261 return sprintf(buf, "%d\n", atomic_read(&mdev_avail_ports) / ports); 1262 } 1263 1264 static MDEV_TYPE_ATTR_RO(available_instances); 1265 1266 static ssize_t device_api_show(struct mdev_type *mtype, 1267 struct mdev_type_attribute *attr, char *buf) 1268 { 1269 return sprintf(buf, "%s\n", VFIO_DEVICE_API_PCI_STRING); 1270 } 1271 1272 static MDEV_TYPE_ATTR_RO(device_api); 1273 1274 static struct attribute *mdev_types_attrs[] = { 1275 &mdev_type_attr_name.attr, 1276 &mdev_type_attr_device_api.attr, 1277 &mdev_type_attr_available_instances.attr, 1278 NULL, 1279 }; 1280 1281 static struct attribute_group mdev_type_group1 = { 1282 .name = "1", 1283 .attrs = mdev_types_attrs, 1284 }; 1285 1286 static struct attribute_group mdev_type_group2 = { 1287 .name = "2", 1288 .attrs = mdev_types_attrs, 1289 }; 1290 1291 static struct attribute_group *mdev_type_groups[] = { 1292 &mdev_type_group1, 1293 &mdev_type_group2, 1294 NULL, 1295 }; 1296 1297 static const struct vfio_device_ops mtty_dev_ops = { 1298 .name = "vfio-mtty", 1299 .init = mtty_init_dev, 1300 .release = mtty_release_dev, 1301 .read = mtty_read, 1302 .write = mtty_write, 1303 .ioctl = mtty_ioctl, 1304 }; 1305 1306 static struct mdev_driver mtty_driver = { 1307 .driver = { 1308 .name = "mtty", 1309 .owner = THIS_MODULE, 1310 .mod_name = KBUILD_MODNAME, 1311 .dev_groups = mdev_dev_groups, 1312 }, 1313 .probe = mtty_probe, 1314 .remove = mtty_remove, 1315 .supported_type_groups = mdev_type_groups, 1316 }; 1317 1318 static void mtty_device_release(struct device *dev) 1319 { 1320 dev_dbg(dev, "mtty: released\n"); 1321 } 1322 1323 static int __init mtty_dev_init(void) 1324 { 1325 int ret = 0; 1326 1327 pr_info("mtty_dev: %s\n", __func__); 1328 1329 memset(&mtty_dev, 0, sizeof(mtty_dev)); 1330 1331 idr_init(&mtty_dev.vd_idr); 1332 1333 ret = alloc_chrdev_region(&mtty_dev.vd_devt, 0, MINORMASK + 1, 1334 MTTY_NAME); 1335 1336 if (ret < 0) { 1337 pr_err("Error: failed to register mtty_dev, err:%d\n", ret); 1338 return ret; 1339 } 1340 1341 cdev_init(&mtty_dev.vd_cdev, &vd_fops); 1342 cdev_add(&mtty_dev.vd_cdev, mtty_dev.vd_devt, MINORMASK + 1); 1343 1344 pr_info("major_number:%d\n", MAJOR(mtty_dev.vd_devt)); 1345 1346 ret = mdev_register_driver(&mtty_driver); 1347 if (ret) 1348 goto err_cdev; 1349 1350 mtty_dev.vd_class = class_create(THIS_MODULE, MTTY_CLASS_NAME); 1351 1352 if (IS_ERR(mtty_dev.vd_class)) { 1353 pr_err("Error: failed to register mtty_dev class\n"); 1354 ret = PTR_ERR(mtty_dev.vd_class); 1355 goto err_driver; 1356 } 1357 1358 mtty_dev.dev.class = mtty_dev.vd_class; 1359 mtty_dev.dev.release = mtty_device_release; 1360 dev_set_name(&mtty_dev.dev, "%s", MTTY_NAME); 1361 1362 ret = device_register(&mtty_dev.dev); 1363 if (ret) 1364 goto err_class; 1365 1366 ret = mdev_register_device(&mtty_dev.dev, &mtty_driver); 1367 if (ret) 1368 goto err_device; 1369 return 0; 1370 1371 err_device: 1372 device_unregister(&mtty_dev.dev); 1373 err_class: 1374 class_destroy(mtty_dev.vd_class); 1375 err_driver: 1376 mdev_unregister_driver(&mtty_driver); 1377 err_cdev: 1378 cdev_del(&mtty_dev.vd_cdev); 1379 unregister_chrdev_region(mtty_dev.vd_devt, MINORMASK + 1); 1380 return ret; 1381 } 1382 1383 static void __exit mtty_dev_exit(void) 1384 { 1385 mtty_dev.dev.bus = NULL; 1386 mdev_unregister_device(&mtty_dev.dev); 1387 1388 device_unregister(&mtty_dev.dev); 1389 idr_destroy(&mtty_dev.vd_idr); 1390 mdev_unregister_driver(&mtty_driver); 1391 cdev_del(&mtty_dev.vd_cdev); 1392 unregister_chrdev_region(mtty_dev.vd_devt, MINORMASK + 1); 1393 class_destroy(mtty_dev.vd_class); 1394 mtty_dev.vd_class = NULL; 1395 pr_info("mtty_dev: Unloaded!\n"); 1396 } 1397 1398 module_init(mtty_dev_init) 1399 module_exit(mtty_dev_exit) 1400 1401 MODULE_LICENSE("GPL v2"); 1402 MODULE_INFO(supported, "Test driver that simulate serial port over PCI"); 1403 MODULE_VERSION(VERSION_STRING); 1404 MODULE_AUTHOR(DRIVER_AUTHOR); 1405