qemu/hw/pci/msi.c
<<
>>
Prefs
   1/*
   2 * msi.c
   3 *
   4 * Copyright (c) 2010 Isaku Yamahata <yamahata at valinux co jp>
   5 *                    VA Linux Systems Japan K.K.
   6 *
   7 * This program is free software; you can redistribute it and/or modify
   8 * it under the terms of the GNU General Public License as published by
   9 * the Free Software Foundation; either version 2 of the License, or
  10 * (at your option) any later version.
  11
  12 * This program is distributed in the hope that it will be useful,
  13 * but WITHOUT ANY WARRANTY; without even the implied warranty of
  14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
  15 * GNU General Public License for more details.
  16
  17 * You should have received a copy of the GNU General Public License along
  18 * with this program; if not, see <http://www.gnu.org/licenses/>.
  19 */
  20
  21#include "qemu/osdep.h"
  22#include "hw/pci/msi.h"
  23#include "hw/xen/xen.h"
  24#include "qemu/range.h"
  25#include "qapi/error.h"
  26
  27/* PCI_MSI_ADDRESS_LO */
  28#define PCI_MSI_ADDRESS_LO_MASK         (~0x3)
  29
  30/* If we get rid of cap allocator, we won't need those. */
  31#define PCI_MSI_32_SIZEOF       0x0a
  32#define PCI_MSI_64_SIZEOF       0x0e
  33#define PCI_MSI_32M_SIZEOF      0x14
  34#define PCI_MSI_64M_SIZEOF      0x18
  35
  36#define PCI_MSI_VECTORS_MAX     32
  37
  38/*
  39 * Flag for interrupt controllers to declare broken MSI/MSI-X support.
  40 * values: false - broken; true - non-broken.
  41 *
  42 * Setting this flag to false will remove MSI/MSI-X capability from all devices.
  43 *
  44 * It is preferable for controllers to set this to true (non-broken) even if
  45 * they do not actually support MSI/MSI-X: guests normally probe the controller
  46 * type and do not attempt to enable MSI/MSI-X with interrupt controllers not
  47 * supporting such, so removing the capability is not required, and
  48 * it seems cleaner to have a given device look the same for all boards.
  49 *
  50 * TODO: some existing controllers violate the above rule. Identify and fix them.
  51 */
  52bool msi_nonbroken;
  53
  54/* If we get rid of cap allocator, we won't need this. */
  55static inline uint8_t msi_cap_sizeof(uint16_t flags)
  56{
  57    switch (flags & (PCI_MSI_FLAGS_MASKBIT | PCI_MSI_FLAGS_64BIT)) {
  58    case PCI_MSI_FLAGS_MASKBIT | PCI_MSI_FLAGS_64BIT:
  59        return PCI_MSI_64M_SIZEOF;
  60    case PCI_MSI_FLAGS_64BIT:
  61        return PCI_MSI_64_SIZEOF;
  62    case PCI_MSI_FLAGS_MASKBIT:
  63        return PCI_MSI_32M_SIZEOF;
  64    case 0:
  65        return PCI_MSI_32_SIZEOF;
  66    default:
  67        abort();
  68        break;
  69    }
  70    return 0;
  71}
  72
  73//#define MSI_DEBUG
  74
  75#ifdef MSI_DEBUG
  76# define MSI_DPRINTF(fmt, ...)                                          \
  77    fprintf(stderr, "%s:%d " fmt, __func__, __LINE__, ## __VA_ARGS__)
  78#else
  79# define MSI_DPRINTF(fmt, ...)  do { } while (0)
  80#endif
  81#define MSI_DEV_PRINTF(dev, fmt, ...)                                   \
  82    MSI_DPRINTF("%s:%x " fmt, (dev)->name, (dev)->devfn, ## __VA_ARGS__)
  83
  84static inline unsigned int msi_nr_vectors(uint16_t flags)
  85{
  86    return 1U <<
  87        ((flags & PCI_MSI_FLAGS_QSIZE) >> ctz32(PCI_MSI_FLAGS_QSIZE));
  88}
  89
  90static inline uint8_t msi_flags_off(const PCIDevice* dev)
  91{
  92    return dev->msi_cap + PCI_MSI_FLAGS;
  93}
  94
  95static inline uint8_t msi_address_lo_off(const PCIDevice* dev)
  96{
  97    return dev->msi_cap + PCI_MSI_ADDRESS_LO;
  98}
  99
 100static inline uint8_t msi_address_hi_off(const PCIDevice* dev)
 101{
 102    return dev->msi_cap + PCI_MSI_ADDRESS_HI;
 103}
 104
 105static inline uint8_t msi_data_off(const PCIDevice* dev, bool msi64bit)
 106{
 107    return dev->msi_cap + (msi64bit ? PCI_MSI_DATA_64 : PCI_MSI_DATA_32);
 108}
 109
 110static inline uint8_t msi_mask_off(const PCIDevice* dev, bool msi64bit)
 111{
 112    return dev->msi_cap + (msi64bit ? PCI_MSI_MASK_64 : PCI_MSI_MASK_32);
 113}
 114
 115static inline uint8_t msi_pending_off(const PCIDevice* dev, bool msi64bit)
 116{
 117    return dev->msi_cap + (msi64bit ? PCI_MSI_PENDING_64 : PCI_MSI_PENDING_32);
 118}
 119
 120/*
 121 * Special API for POWER to configure the vectors through
 122 * a side channel. Should never be used by devices.
 123 */
 124void msi_set_message(PCIDevice *dev, MSIMessage msg)
 125{
 126    uint16_t flags = pci_get_word(dev->config + msi_flags_off(dev));
 127    bool msi64bit = flags & PCI_MSI_FLAGS_64BIT;
 128
 129    if (msi64bit) {
 130        pci_set_quad(dev->config + msi_address_lo_off(dev), msg.address);
 131    } else {
 132        pci_set_long(dev->config + msi_address_lo_off(dev), msg.address);
 133    }
 134    pci_set_word(dev->config + msi_data_off(dev, msi64bit), msg.data);
 135}
 136
 137static MSIMessage msi_prepare_message(PCIDevice *dev, unsigned int vector)
 138{
 139    uint16_t flags = pci_get_word(dev->config + msi_flags_off(dev));
 140    bool msi64bit = flags & PCI_MSI_FLAGS_64BIT;
 141    unsigned int nr_vectors = msi_nr_vectors(flags);
 142    MSIMessage msg;
 143
 144    assert(vector < nr_vectors);
 145
 146    if (msi64bit) {
 147        msg.address = pci_get_quad(dev->config + msi_address_lo_off(dev));
 148    } else {
 149        msg.address = pci_get_long(dev->config + msi_address_lo_off(dev));
 150    }
 151
 152    /* upper bit 31:16 is zero */
 153    msg.data = pci_get_word(dev->config + msi_data_off(dev, msi64bit));
 154    if (nr_vectors > 1) {
 155        msg.data &= ~(nr_vectors - 1);
 156        msg.data |= vector;
 157    }
 158
 159    return msg;
 160}
 161
 162MSIMessage msi_get_message(PCIDevice *dev, unsigned int vector)
 163{
 164    return dev->msi_prepare_message(dev, vector);
 165}
 166
 167bool msi_enabled(const PCIDevice *dev)
 168{
 169    return msi_present(dev) &&
 170        (pci_get_word(dev->config + msi_flags_off(dev)) &
 171         PCI_MSI_FLAGS_ENABLE);
 172}
 173
 174/*
 175 * Make PCI device @dev MSI-capable.
 176 * Non-zero @offset puts capability MSI at that offset in PCI config
 177 * space.
 178 * @nr_vectors is the number of MSI vectors (1, 2, 4, 8, 16 or 32).
 179 * If @msi64bit, make the device capable of sending a 64-bit message
 180 * address.
 181 * If @msi_per_vector_mask, make the device support per-vector masking.
 182 * @errp is for returning errors.
 183 * Return 0 on success; set @errp and return -errno on error.
 184 *
 185 * -ENOTSUP means lacking msi support for a msi-capable platform.
 186 * -EINVAL means capability overlap, happens when @offset is non-zero,
 187 *  also means a programming error, except device assignment, which can check
 188 *  if a real HW is broken.
 189 */
 190int msi_init(struct PCIDevice *dev, uint8_t offset,
 191             unsigned int nr_vectors, bool msi64bit,
 192             bool msi_per_vector_mask, Error **errp)
 193{
 194    unsigned int vectors_order;
 195    uint16_t flags;
 196    uint8_t cap_size;
 197    int config_offset;
 198
 199    if (!msi_nonbroken) {
 200        error_setg(errp, "MSI is not supported by interrupt controller");
 201        return -ENOTSUP;
 202    }
 203
 204    MSI_DEV_PRINTF(dev,
 205                   "init offset: 0x%"PRIx8" vector: %"PRId8
 206                   " 64bit %d mask %d\n",
 207                   offset, nr_vectors, msi64bit, msi_per_vector_mask);
 208
 209    assert(!(nr_vectors & (nr_vectors - 1)));   /* power of 2 */
 210    assert(nr_vectors > 0);
 211    assert(nr_vectors <= PCI_MSI_VECTORS_MAX);
 212    /* the nr of MSI vectors is up to 32 */
 213    vectors_order = ctz32(nr_vectors);
 214
 215    flags = vectors_order << ctz32(PCI_MSI_FLAGS_QMASK);
 216    if (msi64bit) {
 217        flags |= PCI_MSI_FLAGS_64BIT;
 218    }
 219    if (msi_per_vector_mask) {
 220        flags |= PCI_MSI_FLAGS_MASKBIT;
 221    }
 222
 223    cap_size = msi_cap_sizeof(flags);
 224    config_offset = pci_add_capability(dev, PCI_CAP_ID_MSI, offset,
 225                                        cap_size, errp);
 226    if (config_offset < 0) {
 227        return config_offset;
 228    }
 229
 230    dev->msi_cap = config_offset;
 231    dev->cap_present |= QEMU_PCI_CAP_MSI;
 232
 233    pci_set_word(dev->config + msi_flags_off(dev), flags);
 234    pci_set_word(dev->wmask + msi_flags_off(dev),
 235                 PCI_MSI_FLAGS_QSIZE | PCI_MSI_FLAGS_ENABLE);
 236    pci_set_long(dev->wmask + msi_address_lo_off(dev),
 237                 PCI_MSI_ADDRESS_LO_MASK);
 238    if (msi64bit) {
 239        pci_set_long(dev->wmask + msi_address_hi_off(dev), 0xffffffff);
 240    }
 241    pci_set_word(dev->wmask + msi_data_off(dev, msi64bit), 0xffff);
 242
 243    if (msi_per_vector_mask) {
 244        /* Make mask bits 0 to nr_vectors - 1 writable. */
 245        pci_set_long(dev->wmask + msi_mask_off(dev, msi64bit),
 246                     0xffffffff >> (PCI_MSI_VECTORS_MAX - nr_vectors));
 247    }
 248
 249    dev->msi_prepare_message = msi_prepare_message;
 250
 251    return 0;
 252}
 253
 254void msi_uninit(struct PCIDevice *dev)
 255{
 256    uint16_t flags;
 257    uint8_t cap_size;
 258
 259    if (!msi_present(dev)) {
 260        return;
 261    }
 262    flags = pci_get_word(dev->config + msi_flags_off(dev));
 263    cap_size = msi_cap_sizeof(flags);
 264    pci_del_capability(dev, PCI_CAP_ID_MSI, cap_size);
 265    dev->cap_present &= ~QEMU_PCI_CAP_MSI;
 266    dev->msi_prepare_message = NULL;
 267
 268    MSI_DEV_PRINTF(dev, "uninit\n");
 269}
 270
 271void msi_reset(PCIDevice *dev)
 272{
 273    uint16_t flags;
 274    bool msi64bit;
 275
 276    if (!msi_present(dev)) {
 277        return;
 278    }
 279
 280    flags = pci_get_word(dev->config + msi_flags_off(dev));
 281    flags &= ~(PCI_MSI_FLAGS_QSIZE | PCI_MSI_FLAGS_ENABLE);
 282    msi64bit = flags & PCI_MSI_FLAGS_64BIT;
 283
 284    pci_set_word(dev->config + msi_flags_off(dev), flags);
 285    pci_set_long(dev->config + msi_address_lo_off(dev), 0);
 286    if (msi64bit) {
 287        pci_set_long(dev->config + msi_address_hi_off(dev), 0);
 288    }
 289    pci_set_word(dev->config + msi_data_off(dev, msi64bit), 0);
 290    if (flags & PCI_MSI_FLAGS_MASKBIT) {
 291        pci_set_long(dev->config + msi_mask_off(dev, msi64bit), 0);
 292        pci_set_long(dev->config + msi_pending_off(dev, msi64bit), 0);
 293    }
 294    MSI_DEV_PRINTF(dev, "reset\n");
 295}
 296
 297bool msi_is_masked(const PCIDevice *dev, unsigned int vector)
 298{
 299    uint16_t flags = pci_get_word(dev->config + msi_flags_off(dev));
 300    uint32_t mask, data;
 301    bool msi64bit = flags & PCI_MSI_FLAGS_64BIT;
 302    assert(vector < PCI_MSI_VECTORS_MAX);
 303
 304    if (!(flags & PCI_MSI_FLAGS_MASKBIT)) {
 305        return false;
 306    }
 307
 308    data = pci_get_word(dev->config + msi_data_off(dev, msi64bit));
 309    if (xen_is_pirq_msi(data)) {
 310        return false;
 311    }
 312
 313    mask = pci_get_long(dev->config +
 314                        msi_mask_off(dev, flags & PCI_MSI_FLAGS_64BIT));
 315    return mask & (1U << vector);
 316}
 317
 318void msi_set_mask(PCIDevice *dev, int vector, bool mask, Error **errp)
 319{
 320    ERRP_GUARD();
 321    uint16_t flags = pci_get_word(dev->config + msi_flags_off(dev));
 322    bool msi64bit = flags & PCI_MSI_FLAGS_64BIT;
 323    uint32_t irq_state, vector_mask, pending;
 324
 325    if (vector >= PCI_MSI_VECTORS_MAX) {
 326        error_setg(errp, "msi: vector %d not allocated. max vector is %d",
 327                   vector, (PCI_MSI_VECTORS_MAX - 1));
 328        return;
 329    }
 330
 331    vector_mask = (1U << vector);
 332
 333    irq_state = pci_get_long(dev->config + msi_mask_off(dev, msi64bit));
 334
 335    if (mask) {
 336        irq_state |= vector_mask;
 337    } else {
 338        irq_state &= ~vector_mask;
 339    }
 340
 341    pci_set_long(dev->config + msi_mask_off(dev, msi64bit), irq_state);
 342
 343    pending = pci_get_long(dev->config + msi_pending_off(dev, msi64bit));
 344    if (!mask && (pending & vector_mask)) {
 345        pending &= ~vector_mask;
 346        pci_set_long(dev->config + msi_pending_off(dev, msi64bit), pending);
 347        msi_notify(dev, vector);
 348    }
 349}
 350
 351void msi_notify(PCIDevice *dev, unsigned int vector)
 352{
 353    uint16_t flags = pci_get_word(dev->config + msi_flags_off(dev));
 354    bool msi64bit = flags & PCI_MSI_FLAGS_64BIT;
 355    unsigned int nr_vectors = msi_nr_vectors(flags);
 356    MSIMessage msg;
 357
 358    assert(vector < nr_vectors);
 359    if (msi_is_masked(dev, vector)) {
 360        assert(flags & PCI_MSI_FLAGS_MASKBIT);
 361        pci_long_test_and_set_mask(
 362            dev->config + msi_pending_off(dev, msi64bit), 1U << vector);
 363        MSI_DEV_PRINTF(dev, "pending vector 0x%x\n", vector);
 364        return;
 365    }
 366
 367    msg = msi_get_message(dev, vector);
 368
 369    MSI_DEV_PRINTF(dev,
 370                   "notify vector 0x%x"
 371                   " address: 0x%"PRIx64" data: 0x%"PRIx32"\n",
 372                   vector, msg.address, msg.data);
 373    msi_send_message(dev, msg);
 374}
 375
 376void msi_send_message(PCIDevice *dev, MSIMessage msg)
 377{
 378    dev->msi_trigger(dev, msg);
 379}
 380
 381/* Normally called by pci_default_write_config(). */
 382void msi_write_config(PCIDevice *dev, uint32_t addr, uint32_t val, int len)
 383{
 384    uint16_t flags = pci_get_word(dev->config + msi_flags_off(dev));
 385    bool msi64bit = flags & PCI_MSI_FLAGS_64BIT;
 386    bool msi_per_vector_mask = flags & PCI_MSI_FLAGS_MASKBIT;
 387    unsigned int nr_vectors;
 388    uint8_t log_num_vecs;
 389    uint8_t log_max_vecs;
 390    unsigned int vector;
 391    uint32_t pending;
 392
 393    if (!msi_present(dev) ||
 394        !ranges_overlap(addr, len, dev->msi_cap, msi_cap_sizeof(flags))) {
 395        return;
 396    }
 397
 398#ifdef MSI_DEBUG
 399    MSI_DEV_PRINTF(dev, "addr 0x%"PRIx32" val 0x%"PRIx32" len %d\n",
 400                   addr, val, len);
 401    MSI_DEV_PRINTF(dev, "ctrl: 0x%"PRIx16" address: 0x%"PRIx32,
 402                   flags,
 403                   pci_get_long(dev->config + msi_address_lo_off(dev)));
 404    if (msi64bit) {
 405        fprintf(stderr, " address-hi: 0x%"PRIx32,
 406                pci_get_long(dev->config + msi_address_hi_off(dev)));
 407    }
 408    fprintf(stderr, " data: 0x%"PRIx16,
 409            pci_get_word(dev->config + msi_data_off(dev, msi64bit)));
 410    if (flags & PCI_MSI_FLAGS_MASKBIT) {
 411        fprintf(stderr, " mask 0x%"PRIx32" pending 0x%"PRIx32,
 412                pci_get_long(dev->config + msi_mask_off(dev, msi64bit)),
 413                pci_get_long(dev->config + msi_pending_off(dev, msi64bit)));
 414    }
 415    fprintf(stderr, "\n");
 416#endif
 417
 418    if (!(flags & PCI_MSI_FLAGS_ENABLE)) {
 419        return;
 420    }
 421
 422    /*
 423     * Now MSI is enabled, clear INTx# interrupts.
 424     * the driver is prohibited from writing enable bit to mask
 425     * a service request. But the guest OS could do this.
 426     * So we just discard the interrupts as moderate fallback.
 427     *
 428     * 6.8.3.3. Enabling Operation
 429     *   While enabled for MSI or MSI-X operation, a function is prohibited
 430     *   from using its INTx# pin (if implemented) to request
 431     *   service (MSI, MSI-X, and INTx# are mutually exclusive).
 432     */
 433    pci_device_deassert_intx(dev);
 434
 435    /*
 436     * nr_vectors might be set bigger than capable. So clamp it.
 437     * This is not legal by spec, so we can do anything we like,
 438     * just don't crash the host
 439     */
 440    log_num_vecs =
 441        (flags & PCI_MSI_FLAGS_QSIZE) >> ctz32(PCI_MSI_FLAGS_QSIZE);
 442    log_max_vecs =
 443        (flags & PCI_MSI_FLAGS_QMASK) >> ctz32(PCI_MSI_FLAGS_QMASK);
 444    if (log_num_vecs > log_max_vecs) {
 445        flags &= ~PCI_MSI_FLAGS_QSIZE;
 446        flags |= log_max_vecs << ctz32(PCI_MSI_FLAGS_QSIZE);
 447        pci_set_word(dev->config + msi_flags_off(dev), flags);
 448    }
 449
 450    if (!msi_per_vector_mask) {
 451        /* if per vector masking isn't supported,
 452           there is no pending interrupt. */
 453        return;
 454    }
 455
 456    nr_vectors = msi_nr_vectors(flags);
 457
 458    /* This will discard pending interrupts, if any. */
 459    pending = pci_get_long(dev->config + msi_pending_off(dev, msi64bit));
 460    pending &= 0xffffffff >> (PCI_MSI_VECTORS_MAX - nr_vectors);
 461    pci_set_long(dev->config + msi_pending_off(dev, msi64bit), pending);
 462
 463    /* deliver pending interrupts which are unmasked */
 464    for (vector = 0; vector < nr_vectors; ++vector) {
 465        if (msi_is_masked(dev, vector) || !(pending & (1U << vector))) {
 466            continue;
 467        }
 468
 469        pci_long_test_and_clear_mask(
 470            dev->config + msi_pending_off(dev, msi64bit), 1U << vector);
 471        msi_notify(dev, vector);
 472    }
 473}
 474
 475unsigned int msi_nr_vectors_allocated(const PCIDevice *dev)
 476{
 477    uint16_t flags = pci_get_word(dev->config + msi_flags_off(dev));
 478    return msi_nr_vectors(flags);
 479}
 480