1 /* 2 * msi.c 3 * 4 * Copyright (c) 2010 Isaku Yamahata <yamahata at valinux co jp> 5 * VA Linux Systems Japan K.K. 6 * 7 * This program is free software; you can redistribute it and/or modify 8 * it under the terms of the GNU General Public License as published by 9 * the Free Software Foundation; either version 2 of the License, or 10 * (at your option) any later version. 11 12 * This program is distributed in the hope that it will be useful, 13 * but WITHOUT ANY WARRANTY; without even the implied warranty of 14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the 15 * GNU General Public License for more details. 16 17 * You should have received a copy of the GNU General Public License along 18 * with this program; if not, see <http://www.gnu.org/licenses/>. 19 */ 20 21 #include "qemu/osdep.h" 22 #include "hw/pci/msi.h" 23 #include "hw/xen/xen.h" 24 #include "qemu/range.h" 25 #include "qapi/error.h" 26 27 /* PCI_MSI_ADDRESS_LO */ 28 #define PCI_MSI_ADDRESS_LO_MASK (~0x3) 29 30 /* If we get rid of cap allocator, we won't need those. */ 31 #define PCI_MSI_32_SIZEOF 0x0a 32 #define PCI_MSI_64_SIZEOF 0x0e 33 #define PCI_MSI_32M_SIZEOF 0x14 34 #define PCI_MSI_64M_SIZEOF 0x18 35 36 #define PCI_MSI_VECTORS_MAX 32 37 38 /* 39 * Flag for interrupt controllers to declare broken MSI/MSI-X support. 40 * values: false - broken; true - non-broken. 41 * 42 * Setting this flag to false will remove MSI/MSI-X capability from all devices. 43 * 44 * It is preferable for controllers to set this to true (non-broken) even if 45 * they do not actually support MSI/MSI-X: guests normally probe the controller 46 * type and do not attempt to enable MSI/MSI-X with interrupt controllers not 47 * supporting such, so removing the capability is not required, and 48 * it seems cleaner to have a given device look the same for all boards. 49 * 50 * TODO: some existing controllers violate the above rule. Identify and fix them. 51 */ 52 bool msi_nonbroken; 53 54 /* If we get rid of cap allocator, we won't need this. */ 55 static inline uint8_t msi_cap_sizeof(uint16_t flags) 56 { 57 switch (flags & (PCI_MSI_FLAGS_MASKBIT | PCI_MSI_FLAGS_64BIT)) { 58 case PCI_MSI_FLAGS_MASKBIT | PCI_MSI_FLAGS_64BIT: 59 return PCI_MSI_64M_SIZEOF; 60 case PCI_MSI_FLAGS_64BIT: 61 return PCI_MSI_64_SIZEOF; 62 case PCI_MSI_FLAGS_MASKBIT: 63 return PCI_MSI_32M_SIZEOF; 64 case 0: 65 return PCI_MSI_32_SIZEOF; 66 default: 67 abort(); 68 break; 69 } 70 return 0; 71 } 72 73 //#define MSI_DEBUG 74 75 #ifdef MSI_DEBUG 76 # define MSI_DPRINTF(fmt, ...) \ 77 fprintf(stderr, "%s:%d " fmt, __func__, __LINE__, ## __VA_ARGS__) 78 #else 79 # define MSI_DPRINTF(fmt, ...) do { } while (0) 80 #endif 81 #define MSI_DEV_PRINTF(dev, fmt, ...) \ 82 MSI_DPRINTF("%s:%x " fmt, (dev)->name, (dev)->devfn, ## __VA_ARGS__) 83 84 static inline unsigned int msi_nr_vectors(uint16_t flags) 85 { 86 return 1U << 87 ((flags & PCI_MSI_FLAGS_QSIZE) >> ctz32(PCI_MSI_FLAGS_QSIZE)); 88 } 89 90 static inline uint8_t msi_flags_off(const PCIDevice* dev) 91 { 92 return dev->msi_cap + PCI_MSI_FLAGS; 93 } 94 95 static inline uint8_t msi_address_lo_off(const PCIDevice* dev) 96 { 97 return dev->msi_cap + PCI_MSI_ADDRESS_LO; 98 } 99 100 static inline uint8_t msi_address_hi_off(const PCIDevice* dev) 101 { 102 return dev->msi_cap + PCI_MSI_ADDRESS_HI; 103 } 104 105 static inline uint8_t msi_data_off(const PCIDevice* dev, bool msi64bit) 106 { 107 return dev->msi_cap + (msi64bit ? PCI_MSI_DATA_64 : PCI_MSI_DATA_32); 108 } 109 110 static inline uint8_t msi_mask_off(const PCIDevice* dev, bool msi64bit) 111 { 112 return dev->msi_cap + (msi64bit ? PCI_MSI_MASK_64 : PCI_MSI_MASK_32); 113 } 114 115 static inline uint8_t msi_pending_off(const PCIDevice* dev, bool msi64bit) 116 { 117 return dev->msi_cap + (msi64bit ? PCI_MSI_PENDING_64 : PCI_MSI_PENDING_32); 118 } 119 120 /* 121 * Special API for POWER to configure the vectors through 122 * a side channel. Should never be used by devices. 123 */ 124 void msi_set_message(PCIDevice *dev, MSIMessage msg) 125 { 126 uint16_t flags = pci_get_word(dev->config + msi_flags_off(dev)); 127 bool msi64bit = flags & PCI_MSI_FLAGS_64BIT; 128 129 if (msi64bit) { 130 pci_set_quad(dev->config + msi_address_lo_off(dev), msg.address); 131 } else { 132 pci_set_long(dev->config + msi_address_lo_off(dev), msg.address); 133 } 134 pci_set_word(dev->config + msi_data_off(dev, msi64bit), msg.data); 135 } 136 137 static MSIMessage msi_prepare_message(PCIDevice *dev, unsigned int vector) 138 { 139 uint16_t flags = pci_get_word(dev->config + msi_flags_off(dev)); 140 bool msi64bit = flags & PCI_MSI_FLAGS_64BIT; 141 unsigned int nr_vectors = msi_nr_vectors(flags); 142 MSIMessage msg; 143 144 assert(vector < nr_vectors); 145 146 if (msi64bit) { 147 msg.address = pci_get_quad(dev->config + msi_address_lo_off(dev)); 148 } else { 149 msg.address = pci_get_long(dev->config + msi_address_lo_off(dev)); 150 } 151 152 /* upper bit 31:16 is zero */ 153 msg.data = pci_get_word(dev->config + msi_data_off(dev, msi64bit)); 154 if (nr_vectors > 1) { 155 msg.data &= ~(nr_vectors - 1); 156 msg.data |= vector; 157 } 158 159 return msg; 160 } 161 162 MSIMessage msi_get_message(PCIDevice *dev, unsigned int vector) 163 { 164 return dev->msi_prepare_message(dev, vector); 165 } 166 167 bool msi_enabled(const PCIDevice *dev) 168 { 169 return msi_present(dev) && 170 (pci_get_word(dev->config + msi_flags_off(dev)) & 171 PCI_MSI_FLAGS_ENABLE); 172 } 173 174 /* 175 * Make PCI device @dev MSI-capable. 176 * Non-zero @offset puts capability MSI at that offset in PCI config 177 * space. 178 * @nr_vectors is the number of MSI vectors (1, 2, 4, 8, 16 or 32). 179 * If @msi64bit, make the device capable of sending a 64-bit message 180 * address. 181 * If @msi_per_vector_mask, make the device support per-vector masking. 182 * @errp is for returning errors. 183 * Return 0 on success; set @errp and return -errno on error. 184 * 185 * -ENOTSUP means lacking msi support for a msi-capable platform. 186 * -EINVAL means capability overlap, happens when @offset is non-zero, 187 * also means a programming error, except device assignment, which can check 188 * if a real HW is broken. 189 */ 190 int msi_init(struct PCIDevice *dev, uint8_t offset, 191 unsigned int nr_vectors, bool msi64bit, 192 bool msi_per_vector_mask, Error **errp) 193 { 194 unsigned int vectors_order; 195 uint16_t flags; 196 uint8_t cap_size; 197 int config_offset; 198 199 if (!msi_nonbroken) { 200 error_setg(errp, "MSI is not supported by interrupt controller"); 201 return -ENOTSUP; 202 } 203 204 MSI_DEV_PRINTF(dev, 205 "init offset: 0x%"PRIx8" vector: %"PRId8 206 " 64bit %d mask %d\n", 207 offset, nr_vectors, msi64bit, msi_per_vector_mask); 208 209 assert(!(nr_vectors & (nr_vectors - 1))); /* power of 2 */ 210 assert(nr_vectors > 0); 211 assert(nr_vectors <= PCI_MSI_VECTORS_MAX); 212 /* the nr of MSI vectors is up to 32 */ 213 vectors_order = ctz32(nr_vectors); 214 215 flags = vectors_order << ctz32(PCI_MSI_FLAGS_QMASK); 216 if (msi64bit) { 217 flags |= PCI_MSI_FLAGS_64BIT; 218 } 219 if (msi_per_vector_mask) { 220 flags |= PCI_MSI_FLAGS_MASKBIT; 221 } 222 223 cap_size = msi_cap_sizeof(flags); 224 config_offset = pci_add_capability(dev, PCI_CAP_ID_MSI, offset, 225 cap_size, errp); 226 if (config_offset < 0) { 227 return config_offset; 228 } 229 230 dev->msi_cap = config_offset; 231 dev->cap_present |= QEMU_PCI_CAP_MSI; 232 233 pci_set_word(dev->config + msi_flags_off(dev), flags); 234 pci_set_word(dev->wmask + msi_flags_off(dev), 235 PCI_MSI_FLAGS_QSIZE | PCI_MSI_FLAGS_ENABLE); 236 pci_set_long(dev->wmask + msi_address_lo_off(dev), 237 PCI_MSI_ADDRESS_LO_MASK); 238 if (msi64bit) { 239 pci_set_long(dev->wmask + msi_address_hi_off(dev), 0xffffffff); 240 } 241 pci_set_word(dev->wmask + msi_data_off(dev, msi64bit), 0xffff); 242 243 if (msi_per_vector_mask) { 244 /* Make mask bits 0 to nr_vectors - 1 writable. */ 245 pci_set_long(dev->wmask + msi_mask_off(dev, msi64bit), 246 0xffffffff >> (PCI_MSI_VECTORS_MAX - nr_vectors)); 247 } 248 249 dev->msi_prepare_message = msi_prepare_message; 250 251 return 0; 252 } 253 254 void msi_uninit(struct PCIDevice *dev) 255 { 256 uint16_t flags; 257 uint8_t cap_size; 258 259 if (!msi_present(dev)) { 260 return; 261 } 262 flags = pci_get_word(dev->config + msi_flags_off(dev)); 263 cap_size = msi_cap_sizeof(flags); 264 pci_del_capability(dev, PCI_CAP_ID_MSI, cap_size); 265 dev->cap_present &= ~QEMU_PCI_CAP_MSI; 266 dev->msi_prepare_message = NULL; 267 268 MSI_DEV_PRINTF(dev, "uninit\n"); 269 } 270 271 void msi_reset(PCIDevice *dev) 272 { 273 uint16_t flags; 274 bool msi64bit; 275 276 if (!msi_present(dev)) { 277 return; 278 } 279 280 flags = pci_get_word(dev->config + msi_flags_off(dev)); 281 flags &= ~(PCI_MSI_FLAGS_QSIZE | PCI_MSI_FLAGS_ENABLE); 282 msi64bit = flags & PCI_MSI_FLAGS_64BIT; 283 284 pci_set_word(dev->config + msi_flags_off(dev), flags); 285 pci_set_long(dev->config + msi_address_lo_off(dev), 0); 286 if (msi64bit) { 287 pci_set_long(dev->config + msi_address_hi_off(dev), 0); 288 } 289 pci_set_word(dev->config + msi_data_off(dev, msi64bit), 0); 290 if (flags & PCI_MSI_FLAGS_MASKBIT) { 291 pci_set_long(dev->config + msi_mask_off(dev, msi64bit), 0); 292 pci_set_long(dev->config + msi_pending_off(dev, msi64bit), 0); 293 } 294 MSI_DEV_PRINTF(dev, "reset\n"); 295 } 296 297 bool msi_is_masked(const PCIDevice *dev, unsigned int vector) 298 { 299 uint16_t flags = pci_get_word(dev->config + msi_flags_off(dev)); 300 uint32_t mask, data; 301 bool msi64bit = flags & PCI_MSI_FLAGS_64BIT; 302 assert(vector < PCI_MSI_VECTORS_MAX); 303 304 if (!(flags & PCI_MSI_FLAGS_MASKBIT)) { 305 return false; 306 } 307 308 data = pci_get_word(dev->config + msi_data_off(dev, msi64bit)); 309 if (xen_is_pirq_msi(data)) { 310 return false; 311 } 312 313 mask = pci_get_long(dev->config + 314 msi_mask_off(dev, flags & PCI_MSI_FLAGS_64BIT)); 315 return mask & (1U << vector); 316 } 317 318 void msi_set_mask(PCIDevice *dev, int vector, bool mask, Error **errp) 319 { 320 ERRP_GUARD(); 321 uint16_t flags = pci_get_word(dev->config + msi_flags_off(dev)); 322 bool msi64bit = flags & PCI_MSI_FLAGS_64BIT; 323 uint32_t irq_state, vector_mask, pending; 324 325 if (vector > PCI_MSI_VECTORS_MAX) { 326 error_setg(errp, "msi: vector %d not allocated. max vector is %d", 327 vector, PCI_MSI_VECTORS_MAX); 328 return; 329 } 330 331 vector_mask = (1U << vector); 332 333 irq_state = pci_get_long(dev->config + msi_mask_off(dev, msi64bit)); 334 335 if (mask) { 336 irq_state |= vector_mask; 337 } else { 338 irq_state &= ~vector_mask; 339 } 340 341 pci_set_long(dev->config + msi_mask_off(dev, msi64bit), irq_state); 342 343 pending = pci_get_long(dev->config + msi_pending_off(dev, msi64bit)); 344 if (!mask && (pending & vector_mask)) { 345 pending &= ~vector_mask; 346 pci_set_long(dev->config + msi_pending_off(dev, msi64bit), pending); 347 msi_notify(dev, vector); 348 } 349 } 350 351 void msi_notify(PCIDevice *dev, unsigned int vector) 352 { 353 uint16_t flags = pci_get_word(dev->config + msi_flags_off(dev)); 354 bool msi64bit = flags & PCI_MSI_FLAGS_64BIT; 355 unsigned int nr_vectors = msi_nr_vectors(flags); 356 MSIMessage msg; 357 358 assert(vector < nr_vectors); 359 if (msi_is_masked(dev, vector)) { 360 assert(flags & PCI_MSI_FLAGS_MASKBIT); 361 pci_long_test_and_set_mask( 362 dev->config + msi_pending_off(dev, msi64bit), 1U << vector); 363 MSI_DEV_PRINTF(dev, "pending vector 0x%x\n", vector); 364 return; 365 } 366 367 msg = msi_get_message(dev, vector); 368 369 MSI_DEV_PRINTF(dev, 370 "notify vector 0x%x" 371 " address: 0x%"PRIx64" data: 0x%"PRIx32"\n", 372 vector, msg.address, msg.data); 373 msi_send_message(dev, msg); 374 } 375 376 void msi_send_message(PCIDevice *dev, MSIMessage msg) 377 { 378 dev->msi_trigger(dev, msg); 379 } 380 381 /* Normally called by pci_default_write_config(). */ 382 void msi_write_config(PCIDevice *dev, uint32_t addr, uint32_t val, int len) 383 { 384 uint16_t flags = pci_get_word(dev->config + msi_flags_off(dev)); 385 bool msi64bit = flags & PCI_MSI_FLAGS_64BIT; 386 bool msi_per_vector_mask = flags & PCI_MSI_FLAGS_MASKBIT; 387 unsigned int nr_vectors; 388 uint8_t log_num_vecs; 389 uint8_t log_max_vecs; 390 unsigned int vector; 391 uint32_t pending; 392 393 if (!msi_present(dev) || 394 !ranges_overlap(addr, len, dev->msi_cap, msi_cap_sizeof(flags))) { 395 return; 396 } 397 398 #ifdef MSI_DEBUG 399 MSI_DEV_PRINTF(dev, "addr 0x%"PRIx32" val 0x%"PRIx32" len %d\n", 400 addr, val, len); 401 MSI_DEV_PRINTF(dev, "ctrl: 0x%"PRIx16" address: 0x%"PRIx32, 402 flags, 403 pci_get_long(dev->config + msi_address_lo_off(dev))); 404 if (msi64bit) { 405 fprintf(stderr, " address-hi: 0x%"PRIx32, 406 pci_get_long(dev->config + msi_address_hi_off(dev))); 407 } 408 fprintf(stderr, " data: 0x%"PRIx16, 409 pci_get_word(dev->config + msi_data_off(dev, msi64bit))); 410 if (flags & PCI_MSI_FLAGS_MASKBIT) { 411 fprintf(stderr, " mask 0x%"PRIx32" pending 0x%"PRIx32, 412 pci_get_long(dev->config + msi_mask_off(dev, msi64bit)), 413 pci_get_long(dev->config + msi_pending_off(dev, msi64bit))); 414 } 415 fprintf(stderr, "\n"); 416 #endif 417 418 if (!(flags & PCI_MSI_FLAGS_ENABLE)) { 419 return; 420 } 421 422 /* 423 * Now MSI is enabled, clear INTx# interrupts. 424 * the driver is prohibited from writing enable bit to mask 425 * a service request. But the guest OS could do this. 426 * So we just discard the interrupts as moderate fallback. 427 * 428 * 6.8.3.3. Enabling Operation 429 * While enabled for MSI or MSI-X operation, a function is prohibited 430 * from using its INTx# pin (if implemented) to request 431 * service (MSI, MSI-X, and INTx# are mutually exclusive). 432 */ 433 pci_device_deassert_intx(dev); 434 435 /* 436 * nr_vectors might be set bigger than capable. So clamp it. 437 * This is not legal by spec, so we can do anything we like, 438 * just don't crash the host 439 */ 440 log_num_vecs = 441 (flags & PCI_MSI_FLAGS_QSIZE) >> ctz32(PCI_MSI_FLAGS_QSIZE); 442 log_max_vecs = 443 (flags & PCI_MSI_FLAGS_QMASK) >> ctz32(PCI_MSI_FLAGS_QMASK); 444 if (log_num_vecs > log_max_vecs) { 445 flags &= ~PCI_MSI_FLAGS_QSIZE; 446 flags |= log_max_vecs << ctz32(PCI_MSI_FLAGS_QSIZE); 447 pci_set_word(dev->config + msi_flags_off(dev), flags); 448 } 449 450 if (!msi_per_vector_mask) { 451 /* if per vector masking isn't supported, 452 there is no pending interrupt. */ 453 return; 454 } 455 456 nr_vectors = msi_nr_vectors(flags); 457 458 /* This will discard pending interrupts, if any. */ 459 pending = pci_get_long(dev->config + msi_pending_off(dev, msi64bit)); 460 pending &= 0xffffffff >> (PCI_MSI_VECTORS_MAX - nr_vectors); 461 pci_set_long(dev->config + msi_pending_off(dev, msi64bit), pending); 462 463 /* deliver pending interrupts which are unmasked */ 464 for (vector = 0; vector < nr_vectors; ++vector) { 465 if (msi_is_masked(dev, vector) || !(pending & (1U << vector))) { 466 continue; 467 } 468 469 pci_long_test_and_clear_mask( 470 dev->config + msi_pending_off(dev, msi64bit), 1U << vector); 471 msi_notify(dev, vector); 472 } 473 } 474 475 unsigned int msi_nr_vectors_allocated(const PCIDevice *dev) 476 { 477 uint16_t flags = pci_get_word(dev->config + msi_flags_off(dev)); 478 return msi_nr_vectors(flags); 479 } 480