qemu/hw/s390x/s390-pci-bus.c
<<
>>
Prefs
   1/*
   2 * s390 PCI BUS
   3 *
   4 * Copyright 2014 IBM Corp.
   5 * Author(s): Frank Blaschka <frank.blaschka@de.ibm.com>
   6 *            Hong Bo Li <lihbbj@cn.ibm.com>
   7 *            Yi Min Zhao <zyimin@cn.ibm.com>
   8 *
   9 * This work is licensed under the terms of the GNU GPL, version 2 or (at
  10 * your option) any later version. See the COPYING file in the top-level
  11 * directory.
  12 */
  13
  14#include "qemu/osdep.h"
  15#include "qapi/error.h"
  16#include "qapi/visitor.h"
  17#include "hw/s390x/s390-pci-bus.h"
  18#include "hw/s390x/s390-pci-inst.h"
  19#include "hw/s390x/s390-pci-kvm.h"
  20#include "hw/s390x/s390-pci-vfio.h"
  21#include "hw/pci/pci_bus.h"
  22#include "hw/qdev-properties.h"
  23#include "hw/pci/pci_bridge.h"
  24#include "hw/pci/msi.h"
  25#include "qemu/error-report.h"
  26#include "qemu/module.h"
  27#include "sysemu/reset.h"
  28#include "sysemu/runstate.h"
  29
  30#ifndef DEBUG_S390PCI_BUS
  31#define DEBUG_S390PCI_BUS  0
  32#endif
  33
  34#define DPRINTF(fmt, ...)                                         \
  35    do {                                                          \
  36        if (DEBUG_S390PCI_BUS) {                                  \
  37            fprintf(stderr, "S390pci-bus: " fmt, ## __VA_ARGS__); \
  38        }                                                         \
  39    } while (0)
  40
  41S390pciState *s390_get_phb(void)
  42{
  43    static S390pciState *phb;
  44
  45    if (!phb) {
  46        phb = S390_PCI_HOST_BRIDGE(
  47            object_resolve_path(TYPE_S390_PCI_HOST_BRIDGE, NULL));
  48        assert(phb != NULL);
  49    }
  50
  51    return phb;
  52}
  53
  54int pci_chsc_sei_nt2_get_event(void *res)
  55{
  56    ChscSeiNt2Res *nt2_res = (ChscSeiNt2Res *)res;
  57    PciCcdfAvail *accdf;
  58    PciCcdfErr *eccdf;
  59    int rc = 1;
  60    SeiContainer *sei_cont;
  61    S390pciState *s = s390_get_phb();
  62
  63    sei_cont = QTAILQ_FIRST(&s->pending_sei);
  64    if (sei_cont) {
  65        QTAILQ_REMOVE(&s->pending_sei, sei_cont, link);
  66        nt2_res->nt = 2;
  67        nt2_res->cc = sei_cont->cc;
  68        nt2_res->length = cpu_to_be16(sizeof(ChscSeiNt2Res));
  69        switch (sei_cont->cc) {
  70        case 1: /* error event */
  71            eccdf = (PciCcdfErr *)nt2_res->ccdf;
  72            eccdf->fid = cpu_to_be32(sei_cont->fid);
  73            eccdf->fh = cpu_to_be32(sei_cont->fh);
  74            eccdf->e = cpu_to_be32(sei_cont->e);
  75            eccdf->faddr = cpu_to_be64(sei_cont->faddr);
  76            eccdf->pec = cpu_to_be16(sei_cont->pec);
  77            break;
  78        case 2: /* availability event */
  79            accdf = (PciCcdfAvail *)nt2_res->ccdf;
  80            accdf->fid = cpu_to_be32(sei_cont->fid);
  81            accdf->fh = cpu_to_be32(sei_cont->fh);
  82            accdf->pec = cpu_to_be16(sei_cont->pec);
  83            break;
  84        default:
  85            abort();
  86        }
  87        g_free(sei_cont);
  88        rc = 0;
  89    }
  90
  91    return rc;
  92}
  93
  94int pci_chsc_sei_nt2_have_event(void)
  95{
  96    S390pciState *s = s390_get_phb();
  97
  98    return !QTAILQ_EMPTY(&s->pending_sei);
  99}
 100
 101S390PCIBusDevice *s390_pci_find_next_avail_dev(S390pciState *s,
 102                                               S390PCIBusDevice *pbdev)
 103{
 104    S390PCIBusDevice *ret = pbdev ? QTAILQ_NEXT(pbdev, link) :
 105        QTAILQ_FIRST(&s->zpci_devs);
 106
 107    while (ret && ret->state == ZPCI_FS_RESERVED) {
 108        ret = QTAILQ_NEXT(ret, link);
 109    }
 110
 111    return ret;
 112}
 113
 114S390PCIBusDevice *s390_pci_find_dev_by_fid(S390pciState *s, uint32_t fid)
 115{
 116    S390PCIBusDevice *pbdev;
 117
 118    QTAILQ_FOREACH(pbdev, &s->zpci_devs, link) {
 119        if (pbdev->fid == fid) {
 120            return pbdev;
 121        }
 122    }
 123
 124    return NULL;
 125}
 126
 127void s390_pci_sclp_configure(SCCB *sccb)
 128{
 129    IoaCfgSccb *psccb = (IoaCfgSccb *)sccb;
 130    S390PCIBusDevice *pbdev = s390_pci_find_dev_by_fid(s390_get_phb(),
 131                                                       be32_to_cpu(psccb->aid));
 132    uint16_t rc;
 133
 134    if (!pbdev) {
 135        DPRINTF("sclp config no dev found\n");
 136        rc = SCLP_RC_ADAPTER_ID_NOT_RECOGNIZED;
 137        goto out;
 138    }
 139
 140    switch (pbdev->state) {
 141    case ZPCI_FS_RESERVED:
 142        rc = SCLP_RC_ADAPTER_IN_RESERVED_STATE;
 143        break;
 144    case ZPCI_FS_STANDBY:
 145        pbdev->state = ZPCI_FS_DISABLED;
 146        rc = SCLP_RC_NORMAL_COMPLETION;
 147        break;
 148    default:
 149        rc = SCLP_RC_NO_ACTION_REQUIRED;
 150    }
 151out:
 152    psccb->header.response_code = cpu_to_be16(rc);
 153}
 154
 155static void s390_pci_shutdown_notifier(Notifier *n, void *opaque)
 156{
 157    S390PCIBusDevice *pbdev = container_of(n, S390PCIBusDevice,
 158                                           shutdown_notifier);
 159
 160    pci_device_reset(pbdev->pdev);
 161}
 162
 163static void s390_pci_reset_cb(void *opaque)
 164{
 165    S390PCIBusDevice *pbdev = opaque;
 166
 167    pci_device_reset(pbdev->pdev);
 168}
 169
 170static void s390_pci_perform_unplug(S390PCIBusDevice *pbdev)
 171{
 172    HotplugHandler *hotplug_ctrl;
 173
 174    if (pbdev->pft == ZPCI_PFT_ISM) {
 175        notifier_remove(&pbdev->shutdown_notifier);
 176        qemu_unregister_reset(s390_pci_reset_cb, pbdev);
 177    }
 178
 179    /* Unplug the PCI device */
 180    if (pbdev->pdev) {
 181        DeviceState *pdev = DEVICE(pbdev->pdev);
 182
 183        hotplug_ctrl = qdev_get_hotplug_handler(pdev);
 184        hotplug_handler_unplug(hotplug_ctrl, pdev, &error_abort);
 185        object_unparent(OBJECT(pdev));
 186    }
 187
 188    /* Unplug the zPCI device */
 189    hotplug_ctrl = qdev_get_hotplug_handler(DEVICE(pbdev));
 190    hotplug_handler_unplug(hotplug_ctrl, DEVICE(pbdev), &error_abort);
 191    object_unparent(OBJECT(pbdev));
 192}
 193
 194void s390_pci_sclp_deconfigure(SCCB *sccb)
 195{
 196    IoaCfgSccb *psccb = (IoaCfgSccb *)sccb;
 197    S390PCIBusDevice *pbdev = s390_pci_find_dev_by_fid(s390_get_phb(),
 198                                                       be32_to_cpu(psccb->aid));
 199    uint16_t rc;
 200
 201    if (!pbdev) {
 202        DPRINTF("sclp deconfig no dev found\n");
 203        rc = SCLP_RC_ADAPTER_ID_NOT_RECOGNIZED;
 204        goto out;
 205    }
 206
 207    switch (pbdev->state) {
 208    case ZPCI_FS_RESERVED:
 209        rc = SCLP_RC_ADAPTER_IN_RESERVED_STATE;
 210        break;
 211    case ZPCI_FS_STANDBY:
 212        rc = SCLP_RC_NO_ACTION_REQUIRED;
 213        break;
 214    default:
 215        if (pbdev->interp && (pbdev->fh & FH_MASK_ENABLE)) {
 216            /* Interpreted devices were using interrupt forwarding */
 217            s390_pci_kvm_aif_disable(pbdev);
 218        } else if (pbdev->summary_ind) {
 219            pci_dereg_irqs(pbdev);
 220        }
 221        if (pbdev->iommu->enabled) {
 222            pci_dereg_ioat(pbdev->iommu);
 223        }
 224        pbdev->state = ZPCI_FS_STANDBY;
 225        rc = SCLP_RC_NORMAL_COMPLETION;
 226
 227        if (pbdev->unplug_requested) {
 228            s390_pci_perform_unplug(pbdev);
 229        }
 230    }
 231out:
 232    psccb->header.response_code = cpu_to_be16(rc);
 233}
 234
 235static S390PCIBusDevice *s390_pci_find_dev_by_uid(S390pciState *s, uint16_t uid)
 236{
 237    S390PCIBusDevice *pbdev;
 238
 239    QTAILQ_FOREACH(pbdev, &s->zpci_devs, link) {
 240        if (pbdev->uid == uid) {
 241            return pbdev;
 242        }
 243    }
 244
 245    return NULL;
 246}
 247
 248S390PCIBusDevice *s390_pci_find_dev_by_target(S390pciState *s,
 249                                              const char *target)
 250{
 251    S390PCIBusDevice *pbdev;
 252
 253    if (!target) {
 254        return NULL;
 255    }
 256
 257    QTAILQ_FOREACH(pbdev, &s->zpci_devs, link) {
 258        if (!strcmp(pbdev->target, target)) {
 259            return pbdev;
 260        }
 261    }
 262
 263    return NULL;
 264}
 265
 266static S390PCIBusDevice *s390_pci_find_dev_by_pci(S390pciState *s,
 267                                                  PCIDevice *pci_dev)
 268{
 269    S390PCIBusDevice *pbdev;
 270
 271    if (!pci_dev) {
 272        return NULL;
 273    }
 274
 275    QTAILQ_FOREACH(pbdev, &s->zpci_devs, link) {
 276        if (pbdev->pdev == pci_dev) {
 277            return pbdev;
 278        }
 279    }
 280
 281    return NULL;
 282}
 283
 284S390PCIBusDevice *s390_pci_find_dev_by_idx(S390pciState *s, uint32_t idx)
 285{
 286    return g_hash_table_lookup(s->zpci_table, &idx);
 287}
 288
 289S390PCIBusDevice *s390_pci_find_dev_by_fh(S390pciState *s, uint32_t fh)
 290{
 291    uint32_t idx = FH_MASK_INDEX & fh;
 292    S390PCIBusDevice *pbdev = s390_pci_find_dev_by_idx(s, idx);
 293
 294    if (pbdev && pbdev->fh == fh) {
 295        return pbdev;
 296    }
 297
 298    return NULL;
 299}
 300
 301static void s390_pci_generate_event(uint8_t cc, uint16_t pec, uint32_t fh,
 302                                    uint32_t fid, uint64_t faddr, uint32_t e)
 303{
 304    SeiContainer *sei_cont;
 305    S390pciState *s = s390_get_phb();
 306
 307    sei_cont = g_new0(SeiContainer, 1);
 308    sei_cont->fh = fh;
 309    sei_cont->fid = fid;
 310    sei_cont->cc = cc;
 311    sei_cont->pec = pec;
 312    sei_cont->faddr = faddr;
 313    sei_cont->e = e;
 314
 315    QTAILQ_INSERT_TAIL(&s->pending_sei, sei_cont, link);
 316    css_generate_css_crws(0);
 317}
 318
 319static void s390_pci_generate_plug_event(uint16_t pec, uint32_t fh,
 320                                         uint32_t fid)
 321{
 322    s390_pci_generate_event(2, pec, fh, fid, 0, 0);
 323}
 324
 325void s390_pci_generate_error_event(uint16_t pec, uint32_t fh, uint32_t fid,
 326                                   uint64_t faddr, uint32_t e)
 327{
 328    s390_pci_generate_event(1, pec, fh, fid, faddr, e);
 329}
 330
 331static void s390_pci_set_irq(void *opaque, int irq, int level)
 332{
 333    /* nothing to do */
 334}
 335
 336static int s390_pci_map_irq(PCIDevice *pci_dev, int irq_num)
 337{
 338    /* nothing to do */
 339    return 0;
 340}
 341
 342static uint64_t s390_pci_get_table_origin(uint64_t iota)
 343{
 344    return iota & ~ZPCI_IOTA_RTTO_FLAG;
 345}
 346
 347static unsigned int calc_rtx(dma_addr_t ptr)
 348{
 349    return ((unsigned long) ptr >> ZPCI_RT_SHIFT) & ZPCI_INDEX_MASK;
 350}
 351
 352static unsigned int calc_sx(dma_addr_t ptr)
 353{
 354    return ((unsigned long) ptr >> ZPCI_ST_SHIFT) & ZPCI_INDEX_MASK;
 355}
 356
 357static unsigned int calc_px(dma_addr_t ptr)
 358{
 359    return ((unsigned long) ptr >> TARGET_PAGE_BITS) & ZPCI_PT_MASK;
 360}
 361
 362static uint64_t get_rt_sto(uint64_t entry)
 363{
 364    return ((entry & ZPCI_TABLE_TYPE_MASK) == ZPCI_TABLE_TYPE_RTX)
 365                ? (entry & ZPCI_RTE_ADDR_MASK)
 366                : 0;
 367}
 368
 369static uint64_t get_st_pto(uint64_t entry)
 370{
 371    return ((entry & ZPCI_TABLE_TYPE_MASK) == ZPCI_TABLE_TYPE_SX)
 372            ? (entry & ZPCI_STE_ADDR_MASK)
 373            : 0;
 374}
 375
 376static bool rt_entry_isvalid(uint64_t entry)
 377{
 378    return (entry & ZPCI_TABLE_VALID_MASK) == ZPCI_TABLE_VALID;
 379}
 380
 381static bool pt_entry_isvalid(uint64_t entry)
 382{
 383    return (entry & ZPCI_PTE_VALID_MASK) == ZPCI_PTE_VALID;
 384}
 385
 386static bool entry_isprotected(uint64_t entry)
 387{
 388    return (entry & ZPCI_TABLE_PROT_MASK) == ZPCI_TABLE_PROTECTED;
 389}
 390
 391/* ett is expected table type, -1 page table, 0 segment table, 1 region table */
 392static uint64_t get_table_index(uint64_t iova, int8_t ett)
 393{
 394    switch (ett) {
 395    case ZPCI_ETT_PT:
 396        return calc_px(iova);
 397    case ZPCI_ETT_ST:
 398        return calc_sx(iova);
 399    case ZPCI_ETT_RT:
 400        return calc_rtx(iova);
 401    }
 402
 403    return -1;
 404}
 405
 406static bool entry_isvalid(uint64_t entry, int8_t ett)
 407{
 408    switch (ett) {
 409    case ZPCI_ETT_PT:
 410        return pt_entry_isvalid(entry);
 411    case ZPCI_ETT_ST:
 412    case ZPCI_ETT_RT:
 413        return rt_entry_isvalid(entry);
 414    }
 415
 416    return false;
 417}
 418
 419/* Return true if address translation is done */
 420static bool translate_iscomplete(uint64_t entry, int8_t ett)
 421{
 422    switch (ett) {
 423    case 0:
 424        return (entry & ZPCI_TABLE_FC) ? true : false;
 425    case 1:
 426        return false;
 427    }
 428
 429    return true;
 430}
 431
 432static uint64_t get_frame_size(int8_t ett)
 433{
 434    switch (ett) {
 435    case ZPCI_ETT_PT:
 436        return 1ULL << 12;
 437    case ZPCI_ETT_ST:
 438        return 1ULL << 20;
 439    case ZPCI_ETT_RT:
 440        return 1ULL << 31;
 441    }
 442
 443    return 0;
 444}
 445
 446static uint64_t get_next_table_origin(uint64_t entry, int8_t ett)
 447{
 448    switch (ett) {
 449    case ZPCI_ETT_PT:
 450        return entry & ZPCI_PTE_ADDR_MASK;
 451    case ZPCI_ETT_ST:
 452        return get_st_pto(entry);
 453    case ZPCI_ETT_RT:
 454        return get_rt_sto(entry);
 455    }
 456
 457    return 0;
 458}
 459
 460/**
 461 * table_translate: do translation within one table and return the following
 462 *                  table origin
 463 *
 464 * @entry: the entry being translated, the result is stored in this.
 465 * @to: the address of table origin.
 466 * @ett: expected table type, 1 region table, 0 segment table and -1 page table.
 467 * @error: error code
 468 */
 469static uint64_t table_translate(S390IOTLBEntry *entry, uint64_t to, int8_t ett,
 470                                uint16_t *error)
 471{
 472    uint64_t tx, te, nto = 0;
 473    uint16_t err = 0;
 474
 475    tx = get_table_index(entry->iova, ett);
 476    te = address_space_ldq(&address_space_memory, to + tx * sizeof(uint64_t),
 477                           MEMTXATTRS_UNSPECIFIED, NULL);
 478
 479    if (!te) {
 480        err = ERR_EVENT_INVALTE;
 481        goto out;
 482    }
 483
 484    if (!entry_isvalid(te, ett)) {
 485        entry->perm &= IOMMU_NONE;
 486        goto out;
 487    }
 488
 489    if (ett == ZPCI_ETT_RT && ((te & ZPCI_TABLE_LEN_RTX) != ZPCI_TABLE_LEN_RTX
 490                               || te & ZPCI_TABLE_OFFSET_MASK)) {
 491        err = ERR_EVENT_INVALTL;
 492        goto out;
 493    }
 494
 495    nto = get_next_table_origin(te, ett);
 496    if (!nto) {
 497        err = ERR_EVENT_TT;
 498        goto out;
 499    }
 500
 501    if (entry_isprotected(te)) {
 502        entry->perm &= IOMMU_RO;
 503    } else {
 504        entry->perm &= IOMMU_RW;
 505    }
 506
 507    if (translate_iscomplete(te, ett)) {
 508        switch (ett) {
 509        case ZPCI_ETT_PT:
 510            entry->translated_addr = te & ZPCI_PTE_ADDR_MASK;
 511            break;
 512        case ZPCI_ETT_ST:
 513            entry->translated_addr = (te & ZPCI_SFAA_MASK) |
 514                (entry->iova & ~ZPCI_SFAA_MASK);
 515            break;
 516        }
 517        nto = 0;
 518    }
 519out:
 520    if (err) {
 521        entry->perm = IOMMU_NONE;
 522        *error = err;
 523    }
 524    entry->len = get_frame_size(ett);
 525    return nto;
 526}
 527
 528uint16_t s390_guest_io_table_walk(uint64_t g_iota, hwaddr addr,
 529                                  S390IOTLBEntry *entry)
 530{
 531    uint64_t to = s390_pci_get_table_origin(g_iota);
 532    int8_t ett = 1;
 533    uint16_t error = 0;
 534
 535    entry->iova = addr & TARGET_PAGE_MASK;
 536    entry->translated_addr = 0;
 537    entry->perm = IOMMU_RW;
 538
 539    if (entry_isprotected(g_iota)) {
 540        entry->perm &= IOMMU_RO;
 541    }
 542
 543    while (to) {
 544        to = table_translate(entry, to, ett--, &error);
 545    }
 546
 547    return error;
 548}
 549
 550static IOMMUTLBEntry s390_translate_iommu(IOMMUMemoryRegion *mr, hwaddr addr,
 551                                          IOMMUAccessFlags flag, int iommu_idx)
 552{
 553    S390PCIIOMMU *iommu = container_of(mr, S390PCIIOMMU, iommu_mr);
 554    S390IOTLBEntry *entry;
 555    uint64_t iova = addr & TARGET_PAGE_MASK;
 556    uint16_t error = 0;
 557    IOMMUTLBEntry ret = {
 558        .target_as = &address_space_memory,
 559        .iova = 0,
 560        .translated_addr = 0,
 561        .addr_mask = ~(hwaddr)0,
 562        .perm = IOMMU_NONE,
 563    };
 564
 565    switch (iommu->pbdev->state) {
 566    case ZPCI_FS_ENABLED:
 567    case ZPCI_FS_BLOCKED:
 568        if (!iommu->enabled) {
 569            return ret;
 570        }
 571        break;
 572    default:
 573        return ret;
 574    }
 575
 576    DPRINTF("iommu trans addr 0x%" PRIx64 "\n", addr);
 577
 578    if (addr < iommu->pba || addr > iommu->pal) {
 579        error = ERR_EVENT_OORANGE;
 580        goto err;
 581    }
 582
 583    entry = g_hash_table_lookup(iommu->iotlb, &iova);
 584    if (entry) {
 585        ret.iova = entry->iova;
 586        ret.translated_addr = entry->translated_addr;
 587        ret.addr_mask = entry->len - 1;
 588        ret.perm = entry->perm;
 589    } else {
 590        ret.iova = iova;
 591        ret.addr_mask = ~TARGET_PAGE_MASK;
 592        ret.perm = IOMMU_NONE;
 593    }
 594
 595    if (flag != IOMMU_NONE && !(flag & ret.perm)) {
 596        error = ERR_EVENT_TPROTE;
 597    }
 598err:
 599    if (error) {
 600        iommu->pbdev->state = ZPCI_FS_ERROR;
 601        s390_pci_generate_error_event(error, iommu->pbdev->fh,
 602                                      iommu->pbdev->fid, addr, 0);
 603    }
 604    return ret;
 605}
 606
 607static void s390_pci_iommu_replay(IOMMUMemoryRegion *iommu,
 608                                  IOMMUNotifier *notifier)
 609{
 610    /* It's impossible to plug a pci device on s390x that already has iommu
 611     * mappings which need to be replayed, that is due to the "one iommu per
 612     * zpci device" construct. But when we support migration of vfio-pci
 613     * devices in future, we need to revisit this.
 614     */
 615    return;
 616}
 617
 618static S390PCIIOMMU *s390_pci_get_iommu(S390pciState *s, PCIBus *bus,
 619                                        int devfn)
 620{
 621    uint64_t key = (uintptr_t)bus;
 622    S390PCIIOMMUTable *table = g_hash_table_lookup(s->iommu_table, &key);
 623    S390PCIIOMMU *iommu;
 624
 625    if (!table) {
 626        table = g_new0(S390PCIIOMMUTable, 1);
 627        table->key = key;
 628        g_hash_table_insert(s->iommu_table, &table->key, table);
 629    }
 630
 631    iommu = table->iommu[PCI_SLOT(devfn)];
 632    if (!iommu) {
 633        iommu = S390_PCI_IOMMU(object_new(TYPE_S390_PCI_IOMMU));
 634
 635        char *mr_name = g_strdup_printf("iommu-root-%02x:%02x.%01x",
 636                                        pci_bus_num(bus),
 637                                        PCI_SLOT(devfn),
 638                                        PCI_FUNC(devfn));
 639        char *as_name = g_strdup_printf("iommu-pci-%02x:%02x.%01x",
 640                                        pci_bus_num(bus),
 641                                        PCI_SLOT(devfn),
 642                                        PCI_FUNC(devfn));
 643        memory_region_init(&iommu->mr, OBJECT(iommu), mr_name, UINT64_MAX);
 644        address_space_init(&iommu->as, &iommu->mr, as_name);
 645        iommu->iotlb = g_hash_table_new_full(g_int64_hash, g_int64_equal,
 646                                             NULL, g_free);
 647        table->iommu[PCI_SLOT(devfn)] = iommu;
 648
 649        g_free(mr_name);
 650        g_free(as_name);
 651    }
 652
 653    return iommu;
 654}
 655
 656static AddressSpace *s390_pci_dma_iommu(PCIBus *bus, void *opaque, int devfn)
 657{
 658    S390pciState *s = opaque;
 659    S390PCIIOMMU *iommu = s390_pci_get_iommu(s, bus, devfn);
 660
 661    return &iommu->as;
 662}
 663
 664static uint8_t set_ind_atomic(uint64_t ind_loc, uint8_t to_be_set)
 665{
 666    uint8_t expected, actual;
 667    hwaddr len = 1;
 668    /* avoid  multiple fetches */
 669    uint8_t volatile *ind_addr;
 670
 671    ind_addr = cpu_physical_memory_map(ind_loc, &len, true);
 672    if (!ind_addr) {
 673        s390_pci_generate_error_event(ERR_EVENT_AIRERR, 0, 0, 0, 0);
 674        return -1;
 675    }
 676    actual = *ind_addr;
 677    do {
 678        expected = actual;
 679        actual = qatomic_cmpxchg(ind_addr, expected, expected | to_be_set);
 680    } while (actual != expected);
 681    cpu_physical_memory_unmap((void *)ind_addr, len, 1, len);
 682
 683    return actual;
 684}
 685
 686static void s390_msi_ctrl_write(void *opaque, hwaddr addr, uint64_t data,
 687                                unsigned int size)
 688{
 689    S390PCIBusDevice *pbdev = opaque;
 690    uint32_t vec = data & ZPCI_MSI_VEC_MASK;
 691    uint64_t ind_bit;
 692    uint32_t sum_bit;
 693
 694    assert(pbdev);
 695    DPRINTF("write_msix data 0x%" PRIx64 " idx %d vec 0x%x\n", data,
 696            pbdev->idx, vec);
 697
 698    if (pbdev->state != ZPCI_FS_ENABLED) {
 699        return;
 700    }
 701
 702    ind_bit = pbdev->routes.adapter.ind_offset;
 703    sum_bit = pbdev->routes.adapter.summary_offset;
 704
 705    set_ind_atomic(pbdev->routes.adapter.ind_addr + (ind_bit + vec) / 8,
 706                   0x80 >> ((ind_bit + vec) % 8));
 707    if (!set_ind_atomic(pbdev->routes.adapter.summary_addr + sum_bit / 8,
 708                                       0x80 >> (sum_bit % 8))) {
 709        css_adapter_interrupt(CSS_IO_ADAPTER_PCI, pbdev->isc);
 710    }
 711}
 712
 713static uint64_t s390_msi_ctrl_read(void *opaque, hwaddr addr, unsigned size)
 714{
 715    return 0xffffffff;
 716}
 717
 718static const MemoryRegionOps s390_msi_ctrl_ops = {
 719    .write = s390_msi_ctrl_write,
 720    .read = s390_msi_ctrl_read,
 721    .endianness = DEVICE_LITTLE_ENDIAN,
 722};
 723
 724void s390_pci_iommu_enable(S390PCIIOMMU *iommu)
 725{
 726    /*
 727     * The iommu region is initialized against a 0-mapped address space,
 728     * so the smallest IOMMU region we can define runs from 0 to the end
 729     * of the PCI address space.
 730     */
 731    char *name = g_strdup_printf("iommu-s390-%04x", iommu->pbdev->uid);
 732    memory_region_init_iommu(&iommu->iommu_mr, sizeof(iommu->iommu_mr),
 733                             TYPE_S390_IOMMU_MEMORY_REGION, OBJECT(&iommu->mr),
 734                             name, iommu->pal + 1);
 735    iommu->enabled = true;
 736    memory_region_add_subregion(&iommu->mr, 0, MEMORY_REGION(&iommu->iommu_mr));
 737    g_free(name);
 738}
 739
 740void s390_pci_iommu_disable(S390PCIIOMMU *iommu)
 741{
 742    iommu->enabled = false;
 743    g_hash_table_remove_all(iommu->iotlb);
 744    memory_region_del_subregion(&iommu->mr, MEMORY_REGION(&iommu->iommu_mr));
 745    object_unparent(OBJECT(&iommu->iommu_mr));
 746}
 747
 748static void s390_pci_iommu_free(S390pciState *s, PCIBus *bus, int32_t devfn)
 749{
 750    uint64_t key = (uintptr_t)bus;
 751    S390PCIIOMMUTable *table = g_hash_table_lookup(s->iommu_table, &key);
 752    S390PCIIOMMU *iommu = table ? table->iommu[PCI_SLOT(devfn)] : NULL;
 753
 754    if (!table || !iommu) {
 755        return;
 756    }
 757
 758    table->iommu[PCI_SLOT(devfn)] = NULL;
 759    g_hash_table_destroy(iommu->iotlb);
 760    /*
 761     * An attached PCI device may have memory listeners, eg. VFIO PCI.
 762     * The associated subregion will already have been unmapped in
 763     * s390_pci_iommu_disable in response to the guest deconfigure request.
 764     * Remove the listeners now before destroying the address space.
 765     */
 766    address_space_remove_listeners(&iommu->as);
 767    address_space_destroy(&iommu->as);
 768    object_unparent(OBJECT(&iommu->mr));
 769    object_unparent(OBJECT(iommu));
 770    object_unref(OBJECT(iommu));
 771}
 772
 773S390PCIGroup *s390_group_create(int id, int host_id)
 774{
 775    S390PCIGroup *group;
 776    S390pciState *s = s390_get_phb();
 777
 778    group = g_new0(S390PCIGroup, 1);
 779    group->id = id;
 780    group->host_id = host_id;
 781    QTAILQ_INSERT_TAIL(&s->zpci_groups, group, link);
 782    return group;
 783}
 784
 785S390PCIGroup *s390_group_find(int id)
 786{
 787    S390PCIGroup *group;
 788    S390pciState *s = s390_get_phb();
 789
 790    QTAILQ_FOREACH(group, &s->zpci_groups, link) {
 791        if (group->id == id) {
 792            return group;
 793        }
 794    }
 795    return NULL;
 796}
 797
 798S390PCIGroup *s390_group_find_host_sim(int host_id)
 799{
 800    S390PCIGroup *group;
 801    S390pciState *s = s390_get_phb();
 802
 803    QTAILQ_FOREACH(group, &s->zpci_groups, link) {
 804        if (group->id >= ZPCI_SIM_GRP_START && group->host_id == host_id) {
 805            return group;
 806        }
 807    }
 808    return NULL;
 809}
 810
 811static void s390_pci_init_default_group(void)
 812{
 813    S390PCIGroup *group;
 814    ClpRspQueryPciGrp *resgrp;
 815
 816    group = s390_group_create(ZPCI_DEFAULT_FN_GRP, ZPCI_DEFAULT_FN_GRP);
 817    resgrp = &group->zpci_group;
 818    resgrp->fr = 1;
 819    resgrp->dasm = 0;
 820    resgrp->msia = ZPCI_MSI_ADDR;
 821    resgrp->mui = DEFAULT_MUI;
 822    resgrp->i = 128;
 823    resgrp->maxstbl = 128;
 824    resgrp->version = 0;
 825    resgrp->dtsm = ZPCI_DTSM;
 826}
 827
 828static void set_pbdev_info(S390PCIBusDevice *pbdev)
 829{
 830    pbdev->zpci_fn.sdma = ZPCI_SDMA_ADDR;
 831    pbdev->zpci_fn.edma = ZPCI_EDMA_ADDR;
 832    pbdev->zpci_fn.pchid = 0;
 833    pbdev->zpci_fn.pfgid = ZPCI_DEFAULT_FN_GRP;
 834    pbdev->zpci_fn.fid = pbdev->fid;
 835    pbdev->zpci_fn.uid = pbdev->uid;
 836    pbdev->pci_group = s390_group_find(ZPCI_DEFAULT_FN_GRP);
 837}
 838
 839static void s390_pcihost_realize(DeviceState *dev, Error **errp)
 840{
 841    PCIBus *b;
 842    BusState *bus;
 843    PCIHostState *phb = PCI_HOST_BRIDGE(dev);
 844    S390pciState *s = S390_PCI_HOST_BRIDGE(dev);
 845
 846    DPRINTF("host_init\n");
 847
 848    b = pci_register_root_bus(dev, NULL, s390_pci_set_irq, s390_pci_map_irq,
 849                              NULL, get_system_memory(), get_system_io(), 0,
 850                              64, TYPE_PCI_BUS);
 851    pci_setup_iommu(b, s390_pci_dma_iommu, s);
 852
 853    bus = BUS(b);
 854    qbus_set_hotplug_handler(bus, OBJECT(dev));
 855    phb->bus = b;
 856
 857    s->bus = S390_PCI_BUS(qbus_new(TYPE_S390_PCI_BUS, dev, NULL));
 858    qbus_set_hotplug_handler(BUS(s->bus), OBJECT(dev));
 859
 860    s->iommu_table = g_hash_table_new_full(g_int64_hash, g_int64_equal,
 861                                           NULL, g_free);
 862    s->zpci_table = g_hash_table_new_full(g_int_hash, g_int_equal, NULL, NULL);
 863    s->bus_no = 0;
 864    s->next_sim_grp = ZPCI_SIM_GRP_START;
 865    QTAILQ_INIT(&s->pending_sei);
 866    QTAILQ_INIT(&s->zpci_devs);
 867    QTAILQ_INIT(&s->zpci_dma_limit);
 868    QTAILQ_INIT(&s->zpci_groups);
 869
 870    s390_pci_init_default_group();
 871    css_register_io_adapters(CSS_IO_ADAPTER_PCI, true, false,
 872                             S390_ADAPTER_SUPPRESSIBLE, errp);
 873}
 874
 875static void s390_pcihost_unrealize(DeviceState *dev)
 876{
 877    S390PCIGroup *group;
 878    S390pciState *s = S390_PCI_HOST_BRIDGE(dev);
 879
 880    while (!QTAILQ_EMPTY(&s->zpci_groups)) {
 881        group = QTAILQ_FIRST(&s->zpci_groups);
 882        QTAILQ_REMOVE(&s->zpci_groups, group, link);
 883    }
 884}
 885
 886static int s390_pci_msix_init(S390PCIBusDevice *pbdev)
 887{
 888    char *name;
 889    uint8_t pos;
 890    uint16_t ctrl;
 891    uint32_t table, pba;
 892
 893    pos = pci_find_capability(pbdev->pdev, PCI_CAP_ID_MSIX);
 894    if (!pos) {
 895        return -1;
 896    }
 897
 898    ctrl = pci_host_config_read_common(pbdev->pdev, pos + PCI_MSIX_FLAGS,
 899             pci_config_size(pbdev->pdev), sizeof(ctrl));
 900    table = pci_host_config_read_common(pbdev->pdev, pos + PCI_MSIX_TABLE,
 901             pci_config_size(pbdev->pdev), sizeof(table));
 902    pba = pci_host_config_read_common(pbdev->pdev, pos + PCI_MSIX_PBA,
 903             pci_config_size(pbdev->pdev), sizeof(pba));
 904
 905    pbdev->msix.table_bar = table & PCI_MSIX_FLAGS_BIRMASK;
 906    pbdev->msix.table_offset = table & ~PCI_MSIX_FLAGS_BIRMASK;
 907    pbdev->msix.pba_bar = pba & PCI_MSIX_FLAGS_BIRMASK;
 908    pbdev->msix.pba_offset = pba & ~PCI_MSIX_FLAGS_BIRMASK;
 909    pbdev->msix.entries = (ctrl & PCI_MSIX_FLAGS_QSIZE) + 1;
 910
 911    name = g_strdup_printf("msix-s390-%04x", pbdev->uid);
 912    memory_region_init_io(&pbdev->msix_notify_mr, OBJECT(pbdev),
 913                          &s390_msi_ctrl_ops, pbdev, name, TARGET_PAGE_SIZE);
 914    memory_region_add_subregion(&pbdev->iommu->mr,
 915                                pbdev->pci_group->zpci_group.msia,
 916                                &pbdev->msix_notify_mr);
 917    g_free(name);
 918
 919    return 0;
 920}
 921
 922static void s390_pci_msix_free(S390PCIBusDevice *pbdev)
 923{
 924    if (pbdev->msix.entries == 0) {
 925        return;
 926    }
 927
 928    memory_region_del_subregion(&pbdev->iommu->mr, &pbdev->msix_notify_mr);
 929    object_unparent(OBJECT(&pbdev->msix_notify_mr));
 930}
 931
 932static S390PCIBusDevice *s390_pci_device_new(S390pciState *s,
 933                                             const char *target, Error **errp)
 934{
 935    Error *local_err = NULL;
 936    DeviceState *dev;
 937
 938    dev = qdev_try_new(TYPE_S390_PCI_DEVICE);
 939    if (!dev) {
 940        error_setg(errp, "zPCI device could not be created");
 941        return NULL;
 942    }
 943
 944    if (!object_property_set_str(OBJECT(dev), "target", target, &local_err)) {
 945        object_unparent(OBJECT(dev));
 946        error_propagate_prepend(errp, local_err,
 947                                "zPCI device could not be created: ");
 948        return NULL;
 949    }
 950    if (!qdev_realize_and_unref(dev, BUS(s->bus), &local_err)) {
 951        object_unparent(OBJECT(dev));
 952        error_propagate_prepend(errp, local_err,
 953                                "zPCI device could not be created: ");
 954        return NULL;
 955    }
 956
 957    return S390_PCI_DEVICE(dev);
 958}
 959
 960static bool s390_pci_alloc_idx(S390pciState *s, S390PCIBusDevice *pbdev)
 961{
 962    uint32_t idx;
 963
 964    idx = s->next_idx;
 965    while (s390_pci_find_dev_by_idx(s, idx)) {
 966        idx = (idx + 1) & FH_MASK_INDEX;
 967        if (idx == s->next_idx) {
 968            return false;
 969        }
 970    }
 971
 972    pbdev->idx = idx;
 973    return true;
 974}
 975
 976static void s390_pcihost_pre_plug(HotplugHandler *hotplug_dev, DeviceState *dev,
 977                                   Error **errp)
 978{
 979    S390pciState *s = S390_PCI_HOST_BRIDGE(hotplug_dev);
 980
 981    if (!s390_has_feat(S390_FEAT_ZPCI)) {
 982        warn_report("Plugging a PCI/zPCI device without the 'zpci' CPU "
 983                    "feature enabled; the guest will not be able to see/use "
 984                    "this device");
 985    }
 986
 987    if (object_dynamic_cast(OBJECT(dev), TYPE_PCI_DEVICE)) {
 988        PCIDevice *pdev = PCI_DEVICE(dev);
 989
 990        if (pdev->cap_present & QEMU_PCI_CAP_MULTIFUNCTION) {
 991            error_setg(errp, "multifunction not supported in s390");
 992            return;
 993        }
 994    } else if (object_dynamic_cast(OBJECT(dev), TYPE_S390_PCI_DEVICE)) {
 995        S390PCIBusDevice *pbdev = S390_PCI_DEVICE(dev);
 996
 997        if (!s390_pci_alloc_idx(s, pbdev)) {
 998            error_setg(errp, "no slot for plugging zpci device");
 999            return;
1000        }
1001    }
1002}
1003
1004static void s390_pci_update_subordinate(PCIDevice *dev, uint32_t nr)
1005{
1006    uint32_t old_nr;
1007
1008    pci_default_write_config(dev, PCI_SUBORDINATE_BUS, nr, 1);
1009    while (!pci_bus_is_root(pci_get_bus(dev))) {
1010        dev = pci_get_bus(dev)->parent_dev;
1011
1012        old_nr = pci_default_read_config(dev, PCI_SUBORDINATE_BUS, 1);
1013        if (old_nr < nr) {
1014            pci_default_write_config(dev, PCI_SUBORDINATE_BUS, nr, 1);
1015        }
1016    }
1017}
1018
1019static int s390_pci_interp_plug(S390pciState *s, S390PCIBusDevice *pbdev)
1020{
1021    uint32_t idx, fh;
1022
1023    if (!s390_pci_get_host_fh(pbdev, &fh)) {
1024        return -EPERM;
1025    }
1026
1027    /*
1028     * The host device is already in an enabled state, but we always present
1029     * the initial device state to the guest as disabled (ZPCI_FS_DISABLED).
1030     * Therefore, mask off the enable bit from the passthrough handle until
1031     * the guest issues a CLP SET PCI FN later to enable the device.
1032     */
1033    pbdev->fh = fh & ~FH_MASK_ENABLE;
1034
1035    /* Next, see if the idx is already in-use */
1036    idx = pbdev->fh & FH_MASK_INDEX;
1037    if (pbdev->idx != idx) {
1038        if (s390_pci_find_dev_by_idx(s, idx)) {
1039            return -EINVAL;
1040        }
1041        /*
1042         * Update the idx entry with the passed through idx
1043         * If the relinquished idx is lower than next_idx, use it
1044         * to replace next_idx
1045         */
1046        g_hash_table_remove(s->zpci_table, &pbdev->idx);
1047        if (idx < s->next_idx) {
1048            s->next_idx = idx;
1049        }
1050        pbdev->idx = idx;
1051        g_hash_table_insert(s->zpci_table, &pbdev->idx, pbdev);
1052    }
1053
1054    return 0;
1055}
1056
1057static void s390_pcihost_plug(HotplugHandler *hotplug_dev, DeviceState *dev,
1058                              Error **errp)
1059{
1060    S390pciState *s = S390_PCI_HOST_BRIDGE(hotplug_dev);
1061    PCIDevice *pdev = NULL;
1062    S390PCIBusDevice *pbdev = NULL;
1063    int rc;
1064
1065    if (object_dynamic_cast(OBJECT(dev), TYPE_PCI_BRIDGE)) {
1066        PCIBridge *pb = PCI_BRIDGE(dev);
1067
1068        pdev = PCI_DEVICE(dev);
1069        pci_bridge_map_irq(pb, dev->id, s390_pci_map_irq);
1070        pci_setup_iommu(&pb->sec_bus, s390_pci_dma_iommu, s);
1071
1072        qbus_set_hotplug_handler(BUS(&pb->sec_bus), OBJECT(s));
1073
1074        if (dev->hotplugged) {
1075            pci_default_write_config(pdev, PCI_PRIMARY_BUS,
1076                                     pci_dev_bus_num(pdev), 1);
1077            s->bus_no += 1;
1078            pci_default_write_config(pdev, PCI_SECONDARY_BUS, s->bus_no, 1);
1079
1080            s390_pci_update_subordinate(pdev, s->bus_no);
1081        }
1082    } else if (object_dynamic_cast(OBJECT(dev), TYPE_PCI_DEVICE)) {
1083        pdev = PCI_DEVICE(dev);
1084
1085        if (!dev->id) {
1086            /* In the case the PCI device does not define an id */
1087            /* we generate one based on the PCI address         */
1088            dev->id = g_strdup_printf("auto_%02x:%02x.%01x",
1089                                      pci_dev_bus_num(pdev),
1090                                      PCI_SLOT(pdev->devfn),
1091                                      PCI_FUNC(pdev->devfn));
1092        }
1093
1094        pbdev = s390_pci_find_dev_by_target(s, dev->id);
1095        if (!pbdev) {
1096            pbdev = s390_pci_device_new(s, dev->id, errp);
1097            if (!pbdev) {
1098                return;
1099            }
1100        }
1101
1102        pbdev->pdev = pdev;
1103        pbdev->iommu = s390_pci_get_iommu(s, pci_get_bus(pdev), pdev->devfn);
1104        pbdev->iommu->pbdev = pbdev;
1105        pbdev->state = ZPCI_FS_DISABLED;
1106        set_pbdev_info(pbdev);
1107
1108        if (object_dynamic_cast(OBJECT(dev), "vfio-pci")) {
1109            /*
1110             * By default, interpretation is always requested; if the available
1111             * facilities indicate it is not available, fallback to the
1112             * interception model.
1113             */
1114            if (pbdev->interp) {
1115                if (s390_pci_kvm_interp_allowed()) {
1116                    rc = s390_pci_interp_plug(s, pbdev);
1117                    if (rc) {
1118                        error_setg(errp, "Plug failed for zPCI device in "
1119                                   "interpretation mode: %d", rc);
1120                        return;
1121                    }
1122                } else {
1123                    DPRINTF("zPCI interpretation facilities missing.\n");
1124                    pbdev->interp = false;
1125                    pbdev->forwarding_assist = false;
1126                }
1127            }
1128            pbdev->iommu->dma_limit = s390_pci_start_dma_count(s, pbdev);
1129            /* Fill in CLP information passed via the vfio region */
1130            s390_pci_get_clp_info(pbdev);
1131            if (!pbdev->interp) {
1132                /* Do vfio passthrough but intercept for I/O */
1133                pbdev->fh |= FH_SHM_VFIO;
1134                pbdev->forwarding_assist = false;
1135            }
1136            /* Register shutdown notifier and reset callback for ISM devices */
1137            if (pbdev->pft == ZPCI_PFT_ISM) {
1138                pbdev->shutdown_notifier.notify = s390_pci_shutdown_notifier;
1139                qemu_register_shutdown_notifier(&pbdev->shutdown_notifier);
1140                qemu_register_reset(s390_pci_reset_cb, pbdev);
1141            }
1142        } else {
1143            pbdev->fh |= FH_SHM_EMUL;
1144            /* Always intercept emulated devices */
1145            pbdev->interp = false;
1146            pbdev->forwarding_assist = false;
1147        }
1148
1149        if (s390_pci_msix_init(pbdev) && !pbdev->interp) {
1150            error_setg(errp, "MSI-X support is mandatory "
1151                       "in the S390 architecture");
1152            return;
1153        }
1154
1155        if (dev->hotplugged) {
1156            s390_pci_generate_plug_event(HP_EVENT_TO_CONFIGURED ,
1157                                         pbdev->fh, pbdev->fid);
1158        }
1159    } else if (object_dynamic_cast(OBJECT(dev), TYPE_S390_PCI_DEVICE)) {
1160        pbdev = S390_PCI_DEVICE(dev);
1161
1162        /* the allocated idx is actually getting used */
1163        s->next_idx = (pbdev->idx + 1) & FH_MASK_INDEX;
1164        pbdev->fh = pbdev->idx;
1165        QTAILQ_INSERT_TAIL(&s->zpci_devs, pbdev, link);
1166        g_hash_table_insert(s->zpci_table, &pbdev->idx, pbdev);
1167    } else {
1168        g_assert_not_reached();
1169    }
1170}
1171
1172static void s390_pcihost_unplug(HotplugHandler *hotplug_dev, DeviceState *dev,
1173                                Error **errp)
1174{
1175    S390pciState *s = S390_PCI_HOST_BRIDGE(hotplug_dev);
1176    S390PCIBusDevice *pbdev = NULL;
1177
1178    if (object_dynamic_cast(OBJECT(dev), TYPE_PCI_DEVICE)) {
1179        PCIDevice *pci_dev = PCI_DEVICE(dev);
1180        PCIBus *bus;
1181        int32_t devfn;
1182
1183        pbdev = s390_pci_find_dev_by_pci(s, PCI_DEVICE(dev));
1184        g_assert(pbdev);
1185
1186        s390_pci_generate_plug_event(HP_EVENT_STANDBY_TO_RESERVED,
1187                                     pbdev->fh, pbdev->fid);
1188        bus = pci_get_bus(pci_dev);
1189        devfn = pci_dev->devfn;
1190        qdev_unrealize(dev);
1191
1192        s390_pci_msix_free(pbdev);
1193        s390_pci_iommu_free(s, bus, devfn);
1194        pbdev->pdev = NULL;
1195        pbdev->state = ZPCI_FS_RESERVED;
1196    } else if (object_dynamic_cast(OBJECT(dev), TYPE_S390_PCI_DEVICE)) {
1197        pbdev = S390_PCI_DEVICE(dev);
1198        pbdev->fid = 0;
1199        QTAILQ_REMOVE(&s->zpci_devs, pbdev, link);
1200        g_hash_table_remove(s->zpci_table, &pbdev->idx);
1201        if (pbdev->iommu->dma_limit) {
1202            s390_pci_end_dma_count(s, pbdev->iommu->dma_limit);
1203        }
1204        qdev_unrealize(dev);
1205    }
1206}
1207
1208static void s390_pcihost_unplug_request(HotplugHandler *hotplug_dev,
1209                                        DeviceState *dev,
1210                                        Error **errp)
1211{
1212    S390pciState *s = S390_PCI_HOST_BRIDGE(hotplug_dev);
1213    S390PCIBusDevice *pbdev;
1214
1215    if (object_dynamic_cast(OBJECT(dev), TYPE_PCI_BRIDGE)) {
1216        error_setg(errp, "PCI bridge hot unplug currently not supported");
1217    } else if (object_dynamic_cast(OBJECT(dev), TYPE_PCI_DEVICE)) {
1218        /*
1219         * Redirect the unplug request to the zPCI device and remember that
1220         * we've checked the PCI device already (to prevent endless recursion).
1221         */
1222        pbdev = s390_pci_find_dev_by_pci(s, PCI_DEVICE(dev));
1223        g_assert(pbdev);
1224        pbdev->pci_unplug_request_processed = true;
1225        qdev_unplug(DEVICE(pbdev), errp);
1226    } else if (object_dynamic_cast(OBJECT(dev), TYPE_S390_PCI_DEVICE)) {
1227        pbdev = S390_PCI_DEVICE(dev);
1228
1229        /*
1230         * If unplug was initially requested for the zPCI device, we
1231         * first have to redirect to the PCI device, which will in return
1232         * redirect back to us after performing its checks (if the request
1233         * is not blocked, e.g. because it's a PCI bridge).
1234         */
1235        if (pbdev->pdev && !pbdev->pci_unplug_request_processed) {
1236            qdev_unplug(DEVICE(pbdev->pdev), errp);
1237            return;
1238        }
1239        pbdev->pci_unplug_request_processed = false;
1240
1241        switch (pbdev->state) {
1242        case ZPCI_FS_STANDBY:
1243        case ZPCI_FS_RESERVED:
1244            s390_pci_perform_unplug(pbdev);
1245            break;
1246        default:
1247            /*
1248             * Allow to send multiple requests, e.g. if the guest crashed
1249             * before releasing the device, we would not be able to send
1250             * another request to the same VM (e.g. fresh OS).
1251             */
1252            pbdev->unplug_requested = true;
1253            s390_pci_generate_plug_event(HP_EVENT_DECONFIGURE_REQUEST,
1254                                         pbdev->fh, pbdev->fid);
1255        }
1256    } else {
1257        g_assert_not_reached();
1258    }
1259}
1260
1261static void s390_pci_enumerate_bridge(PCIBus *bus, PCIDevice *pdev,
1262                                      void *opaque)
1263{
1264    S390pciState *s = opaque;
1265    PCIBus *sec_bus = NULL;
1266
1267    if ((pci_default_read_config(pdev, PCI_HEADER_TYPE, 1) !=
1268         PCI_HEADER_TYPE_BRIDGE)) {
1269        return;
1270    }
1271
1272    (s->bus_no)++;
1273    pci_default_write_config(pdev, PCI_PRIMARY_BUS, pci_dev_bus_num(pdev), 1);
1274    pci_default_write_config(pdev, PCI_SECONDARY_BUS, s->bus_no, 1);
1275    pci_default_write_config(pdev, PCI_SUBORDINATE_BUS, s->bus_no, 1);
1276
1277    sec_bus = pci_bridge_get_sec_bus(PCI_BRIDGE(pdev));
1278    if (!sec_bus) {
1279        return;
1280    }
1281
1282    /* Assign numbers to all child bridges. The last is the highest number. */
1283    pci_for_each_device_under_bus(sec_bus, s390_pci_enumerate_bridge, s);
1284    pci_default_write_config(pdev, PCI_SUBORDINATE_BUS, s->bus_no, 1);
1285}
1286
1287static void s390_pcihost_reset(DeviceState *dev)
1288{
1289    S390pciState *s = S390_PCI_HOST_BRIDGE(dev);
1290    PCIBus *bus = s->parent_obj.bus;
1291    S390PCIBusDevice *pbdev, *next;
1292
1293    /* Process all pending unplug requests */
1294    QTAILQ_FOREACH_SAFE(pbdev, &s->zpci_devs, link, next) {
1295        if (pbdev->unplug_requested) {
1296            if (pbdev->interp && (pbdev->fh & FH_MASK_ENABLE)) {
1297                /* Interpreted devices were using interrupt forwarding */
1298                s390_pci_kvm_aif_disable(pbdev);
1299            } else if (pbdev->summary_ind) {
1300                pci_dereg_irqs(pbdev);
1301            }
1302            if (pbdev->iommu->enabled) {
1303                pci_dereg_ioat(pbdev->iommu);
1304            }
1305            pbdev->state = ZPCI_FS_STANDBY;
1306            s390_pci_perform_unplug(pbdev);
1307        }
1308    }
1309
1310    /*
1311     * When resetting a PCI bridge, the assigned numbers are set to 0. So
1312     * on every system reset, we also have to reassign numbers.
1313     */
1314    s->bus_no = 0;
1315    pci_for_each_device_under_bus(bus, s390_pci_enumerate_bridge, s);
1316}
1317
1318static void s390_pcihost_class_init(ObjectClass *klass, void *data)
1319{
1320    DeviceClass *dc = DEVICE_CLASS(klass);
1321    HotplugHandlerClass *hc = HOTPLUG_HANDLER_CLASS(klass);
1322
1323    dc->reset = s390_pcihost_reset;
1324    dc->realize = s390_pcihost_realize;
1325    dc->unrealize = s390_pcihost_unrealize;
1326    hc->pre_plug = s390_pcihost_pre_plug;
1327    hc->plug = s390_pcihost_plug;
1328    hc->unplug_request = s390_pcihost_unplug_request;
1329    hc->unplug = s390_pcihost_unplug;
1330    msi_nonbroken = true;
1331}
1332
1333static const TypeInfo s390_pcihost_info = {
1334    .name          = TYPE_S390_PCI_HOST_BRIDGE,
1335    .parent        = TYPE_PCI_HOST_BRIDGE,
1336    .instance_size = sizeof(S390pciState),
1337    .class_init    = s390_pcihost_class_init,
1338    .interfaces = (InterfaceInfo[]) {
1339        { TYPE_HOTPLUG_HANDLER },
1340        { }
1341    }
1342};
1343
1344static const TypeInfo s390_pcibus_info = {
1345    .name = TYPE_S390_PCI_BUS,
1346    .parent = TYPE_BUS,
1347    .instance_size = sizeof(S390PCIBus),
1348};
1349
1350static uint16_t s390_pci_generate_uid(S390pciState *s)
1351{
1352    uint16_t uid = 0;
1353
1354    do {
1355        uid++;
1356        if (!s390_pci_find_dev_by_uid(s, uid)) {
1357            return uid;
1358        }
1359    } while (uid < ZPCI_MAX_UID);
1360
1361    return UID_UNDEFINED;
1362}
1363
1364static uint32_t s390_pci_generate_fid(S390pciState *s, Error **errp)
1365{
1366    uint32_t fid = 0;
1367
1368    do {
1369        if (!s390_pci_find_dev_by_fid(s, fid)) {
1370            return fid;
1371        }
1372    } while (fid++ != ZPCI_MAX_FID);
1373
1374    error_setg(errp, "no free fid could be found");
1375    return 0;
1376}
1377
1378static void s390_pci_device_realize(DeviceState *dev, Error **errp)
1379{
1380    S390PCIBusDevice *zpci = S390_PCI_DEVICE(dev);
1381    S390pciState *s = s390_get_phb();
1382
1383    if (!zpci->target) {
1384        error_setg(errp, "target must be defined");
1385        return;
1386    }
1387
1388    if (s390_pci_find_dev_by_target(s, zpci->target)) {
1389        error_setg(errp, "target %s already has an associated zpci device",
1390                   zpci->target);
1391        return;
1392    }
1393
1394    if (zpci->uid == UID_UNDEFINED) {
1395        zpci->uid = s390_pci_generate_uid(s);
1396        if (!zpci->uid) {
1397            error_setg(errp, "no free uid could be found");
1398            return;
1399        }
1400    } else if (s390_pci_find_dev_by_uid(s, zpci->uid)) {
1401        error_setg(errp, "uid %u already in use", zpci->uid);
1402        return;
1403    }
1404
1405    if (!zpci->fid_defined) {
1406        Error *local_error = NULL;
1407
1408        zpci->fid = s390_pci_generate_fid(s, &local_error);
1409        if (local_error) {
1410            error_propagate(errp, local_error);
1411            return;
1412        }
1413    } else if (s390_pci_find_dev_by_fid(s, zpci->fid)) {
1414        error_setg(errp, "fid %u already in use", zpci->fid);
1415        return;
1416    }
1417
1418    zpci->state = ZPCI_FS_RESERVED;
1419    zpci->fmb.format = ZPCI_FMB_FORMAT;
1420}
1421
1422static void s390_pci_device_reset(DeviceState *dev)
1423{
1424    S390PCIBusDevice *pbdev = S390_PCI_DEVICE(dev);
1425
1426    switch (pbdev->state) {
1427    case ZPCI_FS_RESERVED:
1428        return;
1429    case ZPCI_FS_STANDBY:
1430        break;
1431    default:
1432        pbdev->fh &= ~FH_MASK_ENABLE;
1433        pbdev->state = ZPCI_FS_DISABLED;
1434        break;
1435    }
1436
1437    if (pbdev->interp && (pbdev->fh & FH_MASK_ENABLE)) {
1438        /* Interpreted devices were using interrupt forwarding */
1439        s390_pci_kvm_aif_disable(pbdev);
1440    } else if (pbdev->summary_ind) {
1441        pci_dereg_irqs(pbdev);
1442    }
1443    if (pbdev->iommu->enabled) {
1444        pci_dereg_ioat(pbdev->iommu);
1445    }
1446
1447    fmb_timer_free(pbdev);
1448}
1449
1450static void s390_pci_get_fid(Object *obj, Visitor *v, const char *name,
1451                         void *opaque, Error **errp)
1452{
1453    Property *prop = opaque;
1454    uint32_t *ptr = object_field_prop_ptr(obj, prop);
1455
1456    visit_type_uint32(v, name, ptr, errp);
1457}
1458
1459static void s390_pci_set_fid(Object *obj, Visitor *v, const char *name,
1460                         void *opaque, Error **errp)
1461{
1462    S390PCIBusDevice *zpci = S390_PCI_DEVICE(obj);
1463    Property *prop = opaque;
1464    uint32_t *ptr = object_field_prop_ptr(obj, prop);
1465
1466    if (!visit_type_uint32(v, name, ptr, errp)) {
1467        return;
1468    }
1469    zpci->fid_defined = true;
1470}
1471
1472static const PropertyInfo s390_pci_fid_propinfo = {
1473    .name = "zpci_fid",
1474    .get = s390_pci_get_fid,
1475    .set = s390_pci_set_fid,
1476};
1477
1478#define DEFINE_PROP_S390_PCI_FID(_n, _s, _f) \
1479    DEFINE_PROP(_n, _s, _f, s390_pci_fid_propinfo, uint32_t)
1480
1481static Property s390_pci_device_properties[] = {
1482    DEFINE_PROP_UINT16("uid", S390PCIBusDevice, uid, UID_UNDEFINED),
1483    DEFINE_PROP_S390_PCI_FID("fid", S390PCIBusDevice, fid),
1484    DEFINE_PROP_STRING("target", S390PCIBusDevice, target),
1485    DEFINE_PROP_BOOL("interpret", S390PCIBusDevice, interp, true),
1486    DEFINE_PROP_BOOL("forwarding-assist", S390PCIBusDevice, forwarding_assist,
1487                     true),
1488    DEFINE_PROP_END_OF_LIST(),
1489};
1490
1491static const VMStateDescription s390_pci_device_vmstate = {
1492    .name = TYPE_S390_PCI_DEVICE,
1493    /*
1494     * TODO: add state handling here, so migration works at least with
1495     * emulated pci devices on s390x
1496     */
1497    .unmigratable = 1,
1498};
1499
1500static void s390_pci_device_class_init(ObjectClass *klass, void *data)
1501{
1502    DeviceClass *dc = DEVICE_CLASS(klass);
1503
1504    dc->desc = "zpci device";
1505    set_bit(DEVICE_CATEGORY_MISC, dc->categories);
1506    dc->reset = s390_pci_device_reset;
1507    dc->bus_type = TYPE_S390_PCI_BUS;
1508    dc->realize = s390_pci_device_realize;
1509    device_class_set_props(dc, s390_pci_device_properties);
1510    dc->vmsd = &s390_pci_device_vmstate;
1511}
1512
1513static const TypeInfo s390_pci_device_info = {
1514    .name = TYPE_S390_PCI_DEVICE,
1515    .parent = TYPE_DEVICE,
1516    .instance_size = sizeof(S390PCIBusDevice),
1517    .class_init = s390_pci_device_class_init,
1518};
1519
1520static const TypeInfo s390_pci_iommu_info = {
1521    .name = TYPE_S390_PCI_IOMMU,
1522    .parent = TYPE_OBJECT,
1523    .instance_size = sizeof(S390PCIIOMMU),
1524};
1525
1526static void s390_iommu_memory_region_class_init(ObjectClass *klass, void *data)
1527{
1528    IOMMUMemoryRegionClass *imrc = IOMMU_MEMORY_REGION_CLASS(klass);
1529
1530    imrc->translate = s390_translate_iommu;
1531    imrc->replay = s390_pci_iommu_replay;
1532}
1533
1534static const TypeInfo s390_iommu_memory_region_info = {
1535    .parent = TYPE_IOMMU_MEMORY_REGION,
1536    .name = TYPE_S390_IOMMU_MEMORY_REGION,
1537    .class_init = s390_iommu_memory_region_class_init,
1538};
1539
1540static void s390_pci_register_types(void)
1541{
1542    type_register_static(&s390_pcihost_info);
1543    type_register_static(&s390_pcibus_info);
1544    type_register_static(&s390_pci_device_info);
1545    type_register_static(&s390_pci_iommu_info);
1546    type_register_static(&s390_iommu_memory_region_info);
1547}
1548
1549type_init(s390_pci_register_types)
1550