linux/arch/sparc/kernel/pci_sun4v.c
<<
>>
Prefs
   1// SPDX-License-Identifier: GPL-2.0
   2/* pci_sun4v.c: SUN4V specific PCI controller support.
   3 *
   4 * Copyright (C) 2006, 2007, 2008 David S. Miller (davem@davemloft.net)
   5 */
   6
   7#include <linux/kernel.h>
   8#include <linux/types.h>
   9#include <linux/pci.h>
  10#include <linux/init.h>
  11#include <linux/slab.h>
  12#include <linux/interrupt.h>
  13#include <linux/percpu.h>
  14#include <linux/irq.h>
  15#include <linux/msi.h>
  16#include <linux/export.h>
  17#include <linux/log2.h>
  18#include <linux/of_device.h>
  19#include <asm/iommu-common.h>
  20
  21#include <asm/iommu.h>
  22#include <asm/irq.h>
  23#include <asm/hypervisor.h>
  24#include <asm/prom.h>
  25
  26#include "pci_impl.h"
  27#include "iommu_common.h"
  28#include "kernel.h"
  29
  30#include "pci_sun4v.h"
  31
  32#define DRIVER_NAME     "pci_sun4v"
  33#define PFX             DRIVER_NAME ": "
  34
  35static unsigned long vpci_major;
  36static unsigned long vpci_minor;
  37
  38struct vpci_version {
  39        unsigned long major;
  40        unsigned long minor;
  41};
  42
  43/* Ordered from largest major to lowest */
  44static struct vpci_version vpci_versions[] = {
  45        { .major = 2, .minor = 0 },
  46        { .major = 1, .minor = 1 },
  47};
  48
  49static unsigned long vatu_major = 1;
  50static unsigned long vatu_minor = 1;
  51
  52#define PGLIST_NENTS    (PAGE_SIZE / sizeof(u64))
  53
  54struct iommu_batch {
  55        struct device   *dev;           /* Device mapping is for.       */
  56        unsigned long   prot;           /* IOMMU page protections       */
  57        unsigned long   entry;          /* Index into IOTSB.            */
  58        u64             *pglist;        /* List of physical pages       */
  59        unsigned long   npages;         /* Number of pages in list.     */
  60};
  61
  62static DEFINE_PER_CPU(struct iommu_batch, iommu_batch);
  63static int iommu_batch_initialized;
  64
  65/* Interrupts must be disabled.  */
  66static inline void iommu_batch_start(struct device *dev, unsigned long prot, unsigned long entry)
  67{
  68        struct iommu_batch *p = this_cpu_ptr(&iommu_batch);
  69
  70        p->dev          = dev;
  71        p->prot         = prot;
  72        p->entry        = entry;
  73        p->npages       = 0;
  74}
  75
  76static inline bool iommu_use_atu(struct iommu *iommu, u64 mask)
  77{
  78        return iommu->atu && mask > DMA_BIT_MASK(32);
  79}
  80
  81/* Interrupts must be disabled.  */
  82static long iommu_batch_flush(struct iommu_batch *p, u64 mask)
  83{
  84        struct pci_pbm_info *pbm = p->dev->archdata.host_controller;
  85        u64 *pglist = p->pglist;
  86        u64 index_count;
  87        unsigned long devhandle = pbm->devhandle;
  88        unsigned long prot = p->prot;
  89        unsigned long entry = p->entry;
  90        unsigned long npages = p->npages;
  91        unsigned long iotsb_num;
  92        unsigned long ret;
  93        long num;
  94
  95        /* VPCI maj=1, min=[0,1] only supports read and write */
  96        if (vpci_major < 2)
  97                prot &= (HV_PCI_MAP_ATTR_READ | HV_PCI_MAP_ATTR_WRITE);
  98
  99        while (npages != 0) {
 100                if (!iommu_use_atu(pbm->iommu, mask)) {
 101                        num = pci_sun4v_iommu_map(devhandle,
 102                                                  HV_PCI_TSBID(0, entry),
 103                                                  npages,
 104                                                  prot,
 105                                                  __pa(pglist));
 106                        if (unlikely(num < 0)) {
 107                                pr_err_ratelimited("%s: IOMMU map of [%08lx:%08llx:%lx:%lx:%lx] failed with status %ld\n",
 108                                                   __func__,
 109                                                   devhandle,
 110                                                   HV_PCI_TSBID(0, entry),
 111                                                   npages, prot, __pa(pglist),
 112                                                   num);
 113                                return -1;
 114                        }
 115                } else {
 116                        index_count = HV_PCI_IOTSB_INDEX_COUNT(npages, entry),
 117                        iotsb_num = pbm->iommu->atu->iotsb->iotsb_num;
 118                        ret = pci_sun4v_iotsb_map(devhandle,
 119                                                  iotsb_num,
 120                                                  index_count,
 121                                                  prot,
 122                                                  __pa(pglist),
 123                                                  &num);
 124                        if (unlikely(ret != HV_EOK)) {
 125                                pr_err_ratelimited("%s: ATU map of [%08lx:%lx:%llx:%lx:%lx] failed with status %ld\n",
 126                                                   __func__,
 127                                                   devhandle, iotsb_num,
 128                                                   index_count, prot,
 129                                                   __pa(pglist), ret);
 130                                return -1;
 131                        }
 132                }
 133                entry += num;
 134                npages -= num;
 135                pglist += num;
 136        }
 137
 138        p->entry = entry;
 139        p->npages = 0;
 140
 141        return 0;
 142}
 143
 144static inline void iommu_batch_new_entry(unsigned long entry, u64 mask)
 145{
 146        struct iommu_batch *p = this_cpu_ptr(&iommu_batch);
 147
 148        if (p->entry + p->npages == entry)
 149                return;
 150        if (p->entry != ~0UL)
 151                iommu_batch_flush(p, mask);
 152        p->entry = entry;
 153}
 154
 155/* Interrupts must be disabled.  */
 156static inline long iommu_batch_add(u64 phys_page, u64 mask)
 157{
 158        struct iommu_batch *p = this_cpu_ptr(&iommu_batch);
 159
 160        BUG_ON(p->npages >= PGLIST_NENTS);
 161
 162        p->pglist[p->npages++] = phys_page;
 163        if (p->npages == PGLIST_NENTS)
 164                return iommu_batch_flush(p, mask);
 165
 166        return 0;
 167}
 168
 169/* Interrupts must be disabled.  */
 170static inline long iommu_batch_end(u64 mask)
 171{
 172        struct iommu_batch *p = this_cpu_ptr(&iommu_batch);
 173
 174        BUG_ON(p->npages >= PGLIST_NENTS);
 175
 176        return iommu_batch_flush(p, mask);
 177}
 178
 179static void *dma_4v_alloc_coherent(struct device *dev, size_t size,
 180                                   dma_addr_t *dma_addrp, gfp_t gfp,
 181                                   unsigned long attrs)
 182{
 183        u64 mask;
 184        unsigned long flags, order, first_page, npages, n;
 185        unsigned long prot = 0;
 186        struct iommu *iommu;
 187        struct iommu_map_table *tbl;
 188        struct page *page;
 189        void *ret;
 190        long entry;
 191        int nid;
 192
 193        size = IO_PAGE_ALIGN(size);
 194        order = get_order(size);
 195        if (unlikely(order >= MAX_ORDER))
 196                return NULL;
 197
 198        npages = size >> IO_PAGE_SHIFT;
 199
 200        if (attrs & DMA_ATTR_WEAK_ORDERING)
 201                prot = HV_PCI_MAP_ATTR_RELAXED_ORDER;
 202
 203        nid = dev->archdata.numa_node;
 204        page = alloc_pages_node(nid, gfp, order);
 205        if (unlikely(!page))
 206                return NULL;
 207
 208        first_page = (unsigned long) page_address(page);
 209        memset((char *)first_page, 0, PAGE_SIZE << order);
 210
 211        iommu = dev->archdata.iommu;
 212        mask = dev->coherent_dma_mask;
 213        if (!iommu_use_atu(iommu, mask))
 214                tbl = &iommu->tbl;
 215        else
 216                tbl = &iommu->atu->tbl;
 217
 218        entry = iommu_tbl_range_alloc(dev, tbl, npages, NULL,
 219                                      (unsigned long)(-1), 0);
 220
 221        if (unlikely(entry == IOMMU_ERROR_CODE))
 222                goto range_alloc_fail;
 223
 224        *dma_addrp = (tbl->table_map_base + (entry << IO_PAGE_SHIFT));
 225        ret = (void *) first_page;
 226        first_page = __pa(first_page);
 227
 228        local_irq_save(flags);
 229
 230        iommu_batch_start(dev,
 231                          (HV_PCI_MAP_ATTR_READ | prot |
 232                           HV_PCI_MAP_ATTR_WRITE),
 233                          entry);
 234
 235        for (n = 0; n < npages; n++) {
 236                long err = iommu_batch_add(first_page + (n * PAGE_SIZE), mask);
 237                if (unlikely(err < 0L))
 238                        goto iommu_map_fail;
 239        }
 240
 241        if (unlikely(iommu_batch_end(mask) < 0L))
 242                goto iommu_map_fail;
 243
 244        local_irq_restore(flags);
 245
 246        return ret;
 247
 248iommu_map_fail:
 249        local_irq_restore(flags);
 250        iommu_tbl_range_free(tbl, *dma_addrp, npages, IOMMU_ERROR_CODE);
 251
 252range_alloc_fail:
 253        free_pages(first_page, order);
 254        return NULL;
 255}
 256
 257unsigned long dma_4v_iotsb_bind(unsigned long devhandle,
 258                                unsigned long iotsb_num,
 259                                struct pci_bus *bus_dev)
 260{
 261        struct pci_dev *pdev;
 262        unsigned long err;
 263        unsigned int bus;
 264        unsigned int device;
 265        unsigned int fun;
 266
 267        list_for_each_entry(pdev, &bus_dev->devices, bus_list) {
 268                if (pdev->subordinate) {
 269                        /* No need to bind pci bridge */
 270                        dma_4v_iotsb_bind(devhandle, iotsb_num,
 271                                          pdev->subordinate);
 272                } else {
 273                        bus = bus_dev->number;
 274                        device = PCI_SLOT(pdev->devfn);
 275                        fun = PCI_FUNC(pdev->devfn);
 276                        err = pci_sun4v_iotsb_bind(devhandle, iotsb_num,
 277                                                   HV_PCI_DEVICE_BUILD(bus,
 278                                                                       device,
 279                                                                       fun));
 280
 281                        /* If bind fails for one device it is going to fail
 282                         * for rest of the devices because we are sharing
 283                         * IOTSB. So in case of failure simply return with
 284                         * error.
 285                         */
 286                        if (err)
 287                                return err;
 288                }
 289        }
 290
 291        return 0;
 292}
 293
 294static void dma_4v_iommu_demap(struct device *dev, unsigned long devhandle,
 295                               dma_addr_t dvma, unsigned long iotsb_num,
 296                               unsigned long entry, unsigned long npages)
 297{
 298        unsigned long num, flags;
 299        unsigned long ret;
 300
 301        local_irq_save(flags);
 302        do {
 303                if (dvma <= DMA_BIT_MASK(32)) {
 304                        num = pci_sun4v_iommu_demap(devhandle,
 305                                                    HV_PCI_TSBID(0, entry),
 306                                                    npages);
 307                } else {
 308                        ret = pci_sun4v_iotsb_demap(devhandle, iotsb_num,
 309                                                    entry, npages, &num);
 310                        if (unlikely(ret != HV_EOK)) {
 311                                pr_err_ratelimited("pci_iotsb_demap() failed with error: %ld\n",
 312                                                   ret);
 313                        }
 314                }
 315                entry += num;
 316                npages -= num;
 317        } while (npages != 0);
 318        local_irq_restore(flags);
 319}
 320
 321static void dma_4v_free_coherent(struct device *dev, size_t size, void *cpu,
 322                                 dma_addr_t dvma, unsigned long attrs)
 323{
 324        struct pci_pbm_info *pbm;
 325        struct iommu *iommu;
 326        struct atu *atu;
 327        struct iommu_map_table *tbl;
 328        unsigned long order, npages, entry;
 329        unsigned long iotsb_num;
 330        u32 devhandle;
 331
 332        npages = IO_PAGE_ALIGN(size) >> IO_PAGE_SHIFT;
 333        iommu = dev->archdata.iommu;
 334        pbm = dev->archdata.host_controller;
 335        atu = iommu->atu;
 336        devhandle = pbm->devhandle;
 337
 338        if (!iommu_use_atu(iommu, dvma)) {
 339                tbl = &iommu->tbl;
 340                iotsb_num = 0; /* we don't care for legacy iommu */
 341        } else {
 342                tbl = &atu->tbl;
 343                iotsb_num = atu->iotsb->iotsb_num;
 344        }
 345        entry = ((dvma - tbl->table_map_base) >> IO_PAGE_SHIFT);
 346        dma_4v_iommu_demap(dev, devhandle, dvma, iotsb_num, entry, npages);
 347        iommu_tbl_range_free(tbl, dvma, npages, IOMMU_ERROR_CODE);
 348        order = get_order(size);
 349        if (order < 10)
 350                free_pages((unsigned long)cpu, order);
 351}
 352
 353static dma_addr_t dma_4v_map_page(struct device *dev, struct page *page,
 354                                  unsigned long offset, size_t sz,
 355                                  enum dma_data_direction direction,
 356                                  unsigned long attrs)
 357{
 358        struct iommu *iommu;
 359        struct atu *atu;
 360        struct iommu_map_table *tbl;
 361        u64 mask;
 362        unsigned long flags, npages, oaddr;
 363        unsigned long i, base_paddr;
 364        unsigned long prot;
 365        dma_addr_t bus_addr, ret;
 366        long entry;
 367
 368        iommu = dev->archdata.iommu;
 369        atu = iommu->atu;
 370
 371        if (unlikely(direction == DMA_NONE))
 372                goto bad;
 373
 374        oaddr = (unsigned long)(page_address(page) + offset);
 375        npages = IO_PAGE_ALIGN(oaddr + sz) - (oaddr & IO_PAGE_MASK);
 376        npages >>= IO_PAGE_SHIFT;
 377
 378        mask = *dev->dma_mask;
 379        if (!iommu_use_atu(iommu, mask))
 380                tbl = &iommu->tbl;
 381        else
 382                tbl = &atu->tbl;
 383
 384        entry = iommu_tbl_range_alloc(dev, tbl, npages, NULL,
 385                                      (unsigned long)(-1), 0);
 386
 387        if (unlikely(entry == IOMMU_ERROR_CODE))
 388                goto bad;
 389
 390        bus_addr = (tbl->table_map_base + (entry << IO_PAGE_SHIFT));
 391        ret = bus_addr | (oaddr & ~IO_PAGE_MASK);
 392        base_paddr = __pa(oaddr & IO_PAGE_MASK);
 393        prot = HV_PCI_MAP_ATTR_READ;
 394        if (direction != DMA_TO_DEVICE)
 395                prot |= HV_PCI_MAP_ATTR_WRITE;
 396
 397        if (attrs & DMA_ATTR_WEAK_ORDERING)
 398                prot |= HV_PCI_MAP_ATTR_RELAXED_ORDER;
 399
 400        local_irq_save(flags);
 401
 402        iommu_batch_start(dev, prot, entry);
 403
 404        for (i = 0; i < npages; i++, base_paddr += IO_PAGE_SIZE) {
 405                long err = iommu_batch_add(base_paddr, mask);
 406                if (unlikely(err < 0L))
 407                        goto iommu_map_fail;
 408        }
 409        if (unlikely(iommu_batch_end(mask) < 0L))
 410                goto iommu_map_fail;
 411
 412        local_irq_restore(flags);
 413
 414        return ret;
 415
 416bad:
 417        if (printk_ratelimit())
 418                WARN_ON(1);
 419        return DMA_MAPPING_ERROR;
 420
 421iommu_map_fail:
 422        local_irq_restore(flags);
 423        iommu_tbl_range_free(tbl, bus_addr, npages, IOMMU_ERROR_CODE);
 424        return DMA_MAPPING_ERROR;
 425}
 426
 427static void dma_4v_unmap_page(struct device *dev, dma_addr_t bus_addr,
 428                              size_t sz, enum dma_data_direction direction,
 429                              unsigned long attrs)
 430{
 431        struct pci_pbm_info *pbm;
 432        struct iommu *iommu;
 433        struct atu *atu;
 434        struct iommu_map_table *tbl;
 435        unsigned long npages;
 436        unsigned long iotsb_num;
 437        long entry;
 438        u32 devhandle;
 439
 440        if (unlikely(direction == DMA_NONE)) {
 441                if (printk_ratelimit())
 442                        WARN_ON(1);
 443                return;
 444        }
 445
 446        iommu = dev->archdata.iommu;
 447        pbm = dev->archdata.host_controller;
 448        atu = iommu->atu;
 449        devhandle = pbm->devhandle;
 450
 451        npages = IO_PAGE_ALIGN(bus_addr + sz) - (bus_addr & IO_PAGE_MASK);
 452        npages >>= IO_PAGE_SHIFT;
 453        bus_addr &= IO_PAGE_MASK;
 454
 455        if (bus_addr <= DMA_BIT_MASK(32)) {
 456                iotsb_num = 0; /* we don't care for legacy iommu */
 457                tbl = &iommu->tbl;
 458        } else {
 459                iotsb_num = atu->iotsb->iotsb_num;
 460                tbl = &atu->tbl;
 461        }
 462        entry = (bus_addr - tbl->table_map_base) >> IO_PAGE_SHIFT;
 463        dma_4v_iommu_demap(dev, devhandle, bus_addr, iotsb_num, entry, npages);
 464        iommu_tbl_range_free(tbl, bus_addr, npages, IOMMU_ERROR_CODE);
 465}
 466
 467static int dma_4v_map_sg(struct device *dev, struct scatterlist *sglist,
 468                         int nelems, enum dma_data_direction direction,
 469                         unsigned long attrs)
 470{
 471        struct scatterlist *s, *outs, *segstart;
 472        unsigned long flags, handle, prot;
 473        dma_addr_t dma_next = 0, dma_addr;
 474        unsigned int max_seg_size;
 475        unsigned long seg_boundary_size;
 476        int outcount, incount, i;
 477        struct iommu *iommu;
 478        struct atu *atu;
 479        struct iommu_map_table *tbl;
 480        u64 mask;
 481        unsigned long base_shift;
 482        long err;
 483
 484        BUG_ON(direction == DMA_NONE);
 485
 486        iommu = dev->archdata.iommu;
 487        if (nelems == 0 || !iommu)
 488                return 0;
 489        atu = iommu->atu;
 490
 491        prot = HV_PCI_MAP_ATTR_READ;
 492        if (direction != DMA_TO_DEVICE)
 493                prot |= HV_PCI_MAP_ATTR_WRITE;
 494
 495        if (attrs & DMA_ATTR_WEAK_ORDERING)
 496                prot |= HV_PCI_MAP_ATTR_RELAXED_ORDER;
 497
 498        outs = s = segstart = &sglist[0];
 499        outcount = 1;
 500        incount = nelems;
 501        handle = 0;
 502
 503        /* Init first segment length for backout at failure */
 504        outs->dma_length = 0;
 505
 506        local_irq_save(flags);
 507
 508        iommu_batch_start(dev, prot, ~0UL);
 509
 510        max_seg_size = dma_get_max_seg_size(dev);
 511        seg_boundary_size = ALIGN(dma_get_seg_boundary(dev) + 1,
 512                                  IO_PAGE_SIZE) >> IO_PAGE_SHIFT;
 513
 514        mask = *dev->dma_mask;
 515        if (!iommu_use_atu(iommu, mask))
 516                tbl = &iommu->tbl;
 517        else
 518                tbl = &atu->tbl;
 519
 520        base_shift = tbl->table_map_base >> IO_PAGE_SHIFT;
 521
 522        for_each_sg(sglist, s, nelems, i) {
 523                unsigned long paddr, npages, entry, out_entry = 0, slen;
 524
 525                slen = s->length;
 526                /* Sanity check */
 527                if (slen == 0) {
 528                        dma_next = 0;
 529                        continue;
 530                }
 531                /* Allocate iommu entries for that segment */
 532                paddr = (unsigned long) SG_ENT_PHYS_ADDRESS(s);
 533                npages = iommu_num_pages(paddr, slen, IO_PAGE_SIZE);
 534                entry = iommu_tbl_range_alloc(dev, tbl, npages,
 535                                              &handle, (unsigned long)(-1), 0);
 536
 537                /* Handle failure */
 538                if (unlikely(entry == IOMMU_ERROR_CODE)) {
 539                        pr_err_ratelimited("iommu_alloc failed, iommu %p paddr %lx npages %lx\n",
 540                                           tbl, paddr, npages);
 541                        goto iommu_map_failed;
 542                }
 543
 544                iommu_batch_new_entry(entry, mask);
 545
 546                /* Convert entry to a dma_addr_t */
 547                dma_addr = tbl->table_map_base + (entry << IO_PAGE_SHIFT);
 548                dma_addr |= (s->offset & ~IO_PAGE_MASK);
 549
 550                /* Insert into HW table */
 551                paddr &= IO_PAGE_MASK;
 552                while (npages--) {
 553                        err = iommu_batch_add(paddr, mask);
 554                        if (unlikely(err < 0L))
 555                                goto iommu_map_failed;
 556                        paddr += IO_PAGE_SIZE;
 557                }
 558
 559                /* If we are in an open segment, try merging */
 560                if (segstart != s) {
 561                        /* We cannot merge if:
 562                         * - allocated dma_addr isn't contiguous to previous allocation
 563                         */
 564                        if ((dma_addr != dma_next) ||
 565                            (outs->dma_length + s->length > max_seg_size) ||
 566                            (is_span_boundary(out_entry, base_shift,
 567                                              seg_boundary_size, outs, s))) {
 568                                /* Can't merge: create a new segment */
 569                                segstart = s;
 570                                outcount++;
 571                                outs = sg_next(outs);
 572                        } else {
 573                                outs->dma_length += s->length;
 574                        }
 575                }
 576
 577                if (segstart == s) {
 578                        /* This is a new segment, fill entries */
 579                        outs->dma_address = dma_addr;
 580                        outs->dma_length = slen;
 581                        out_entry = entry;
 582                }
 583
 584                /* Calculate next page pointer for contiguous check */
 585                dma_next = dma_addr + slen;
 586        }
 587
 588        err = iommu_batch_end(mask);
 589
 590        if (unlikely(err < 0L))
 591                goto iommu_map_failed;
 592
 593        local_irq_restore(flags);
 594
 595        if (outcount < incount) {
 596                outs = sg_next(outs);
 597                outs->dma_address = DMA_MAPPING_ERROR;
 598                outs->dma_length = 0;
 599        }
 600
 601        return outcount;
 602
 603iommu_map_failed:
 604        for_each_sg(sglist, s, nelems, i) {
 605                if (s->dma_length != 0) {
 606                        unsigned long vaddr, npages;
 607
 608                        vaddr = s->dma_address & IO_PAGE_MASK;
 609                        npages = iommu_num_pages(s->dma_address, s->dma_length,
 610                                                 IO_PAGE_SIZE);
 611                        iommu_tbl_range_free(tbl, vaddr, npages,
 612                                             IOMMU_ERROR_CODE);
 613                        /* XXX demap? XXX */
 614                        s->dma_address = DMA_MAPPING_ERROR;
 615                        s->dma_length = 0;
 616                }
 617                if (s == outs)
 618                        break;
 619        }
 620        local_irq_restore(flags);
 621
 622        return 0;
 623}
 624
 625static void dma_4v_unmap_sg(struct device *dev, struct scatterlist *sglist,
 626                            int nelems, enum dma_data_direction direction,
 627                            unsigned long attrs)
 628{
 629        struct pci_pbm_info *pbm;
 630        struct scatterlist *sg;
 631        struct iommu *iommu;
 632        struct atu *atu;
 633        unsigned long flags, entry;
 634        unsigned long iotsb_num;
 635        u32 devhandle;
 636
 637        BUG_ON(direction == DMA_NONE);
 638
 639        iommu = dev->archdata.iommu;
 640        pbm = dev->archdata.host_controller;
 641        atu = iommu->atu;
 642        devhandle = pbm->devhandle;
 643        
 644        local_irq_save(flags);
 645
 646        sg = sglist;
 647        while (nelems--) {
 648                dma_addr_t dma_handle = sg->dma_address;
 649                unsigned int len = sg->dma_length;
 650                unsigned long npages;
 651                struct iommu_map_table *tbl;
 652                unsigned long shift = IO_PAGE_SHIFT;
 653
 654                if (!len)
 655                        break;
 656                npages = iommu_num_pages(dma_handle, len, IO_PAGE_SIZE);
 657
 658                if (dma_handle <= DMA_BIT_MASK(32)) {
 659                        iotsb_num = 0; /* we don't care for legacy iommu */
 660                        tbl = &iommu->tbl;
 661                } else {
 662                        iotsb_num = atu->iotsb->iotsb_num;
 663                        tbl = &atu->tbl;
 664                }
 665                entry = ((dma_handle - tbl->table_map_base) >> shift);
 666                dma_4v_iommu_demap(dev, devhandle, dma_handle, iotsb_num,
 667                                   entry, npages);
 668                iommu_tbl_range_free(tbl, dma_handle, npages,
 669                                     IOMMU_ERROR_CODE);
 670                sg = sg_next(sg);
 671        }
 672
 673        local_irq_restore(flags);
 674}
 675
 676static int dma_4v_supported(struct device *dev, u64 device_mask)
 677{
 678        struct iommu *iommu = dev->archdata.iommu;
 679
 680        if (ali_sound_dma_hack(dev, device_mask))
 681                return 1;
 682        if (device_mask < iommu->dma_addr_mask)
 683                return 0;
 684        return 1;
 685}
 686
 687static const struct dma_map_ops sun4v_dma_ops = {
 688        .alloc                          = dma_4v_alloc_coherent,
 689        .free                           = dma_4v_free_coherent,
 690        .map_page                       = dma_4v_map_page,
 691        .unmap_page                     = dma_4v_unmap_page,
 692        .map_sg                         = dma_4v_map_sg,
 693        .unmap_sg                       = dma_4v_unmap_sg,
 694        .dma_supported                  = dma_4v_supported,
 695};
 696
 697static void pci_sun4v_scan_bus(struct pci_pbm_info *pbm, struct device *parent)
 698{
 699        struct property *prop;
 700        struct device_node *dp;
 701
 702        dp = pbm->op->dev.of_node;
 703        prop = of_find_property(dp, "66mhz-capable", NULL);
 704        pbm->is_66mhz_capable = (prop != NULL);
 705        pbm->pci_bus = pci_scan_one_pbm(pbm, parent);
 706
 707        /* XXX register error interrupt handlers XXX */
 708}
 709
 710static unsigned long probe_existing_entries(struct pci_pbm_info *pbm,
 711                                            struct iommu_map_table *iommu)
 712{
 713        struct iommu_pool *pool;
 714        unsigned long i, pool_nr, cnt = 0;
 715        u32 devhandle;
 716
 717        devhandle = pbm->devhandle;
 718        for (pool_nr = 0; pool_nr < iommu->nr_pools; pool_nr++) {
 719                pool = &(iommu->pools[pool_nr]);
 720                for (i = pool->start; i <= pool->end; i++) {
 721                        unsigned long ret, io_attrs, ra;
 722
 723                        ret = pci_sun4v_iommu_getmap(devhandle,
 724                                                     HV_PCI_TSBID(0, i),
 725                                                     &io_attrs, &ra);
 726                        if (ret == HV_EOK) {
 727                                if (page_in_phys_avail(ra)) {
 728                                        pci_sun4v_iommu_demap(devhandle,
 729                                                              HV_PCI_TSBID(0,
 730                                                              i), 1);
 731                                } else {
 732                                        cnt++;
 733                                        __set_bit(i, iommu->map);
 734                                }
 735                        }
 736                }
 737        }
 738        return cnt;
 739}
 740
 741static int pci_sun4v_atu_alloc_iotsb(struct pci_pbm_info *pbm)
 742{
 743        struct atu *atu = pbm->iommu->atu;
 744        struct atu_iotsb *iotsb;
 745        void *table;
 746        u64 table_size;
 747        u64 iotsb_num;
 748        unsigned long order;
 749        unsigned long err;
 750
 751        iotsb = kzalloc(sizeof(*iotsb), GFP_KERNEL);
 752        if (!iotsb) {
 753                err = -ENOMEM;
 754                goto out_err;
 755        }
 756        atu->iotsb = iotsb;
 757
 758        /* calculate size of IOTSB */
 759        table_size = (atu->size / IO_PAGE_SIZE) * 8;
 760        order = get_order(table_size);
 761        table = (void *)__get_free_pages(GFP_KERNEL | __GFP_ZERO, order);
 762        if (!table) {
 763                err = -ENOMEM;
 764                goto table_failed;
 765        }
 766        iotsb->table = table;
 767        iotsb->ra = __pa(table);
 768        iotsb->dvma_size = atu->size;
 769        iotsb->dvma_base = atu->base;
 770        iotsb->table_size = table_size;
 771        iotsb->page_size = IO_PAGE_SIZE;
 772
 773        /* configure and register IOTSB with HV */
 774        err = pci_sun4v_iotsb_conf(pbm->devhandle,
 775                                   iotsb->ra,
 776                                   iotsb->table_size,
 777                                   iotsb->page_size,
 778                                   iotsb->dvma_base,
 779                                   &iotsb_num);
 780        if (err) {
 781                pr_err(PFX "pci_iotsb_conf failed error: %ld\n", err);
 782                goto iotsb_conf_failed;
 783        }
 784        iotsb->iotsb_num = iotsb_num;
 785
 786        err = dma_4v_iotsb_bind(pbm->devhandle, iotsb_num, pbm->pci_bus);
 787        if (err) {
 788                pr_err(PFX "pci_iotsb_bind failed error: %ld\n", err);
 789                goto iotsb_conf_failed;
 790        }
 791
 792        return 0;
 793
 794iotsb_conf_failed:
 795        free_pages((unsigned long)table, order);
 796table_failed:
 797        kfree(iotsb);
 798out_err:
 799        return err;
 800}
 801
 802static int pci_sun4v_atu_init(struct pci_pbm_info *pbm)
 803{
 804        struct atu *atu = pbm->iommu->atu;
 805        unsigned long err;
 806        const u64 *ranges;
 807        u64 map_size, num_iotte;
 808        u64 dma_mask;
 809        const u32 *page_size;
 810        int len;
 811
 812        ranges = of_get_property(pbm->op->dev.of_node, "iommu-address-ranges",
 813                                 &len);
 814        if (!ranges) {
 815                pr_err(PFX "No iommu-address-ranges\n");
 816                return -EINVAL;
 817        }
 818
 819        page_size = of_get_property(pbm->op->dev.of_node, "iommu-pagesizes",
 820                                    NULL);
 821        if (!page_size) {
 822                pr_err(PFX "No iommu-pagesizes\n");
 823                return -EINVAL;
 824        }
 825
 826        /* There are 4 iommu-address-ranges supported. Each range is pair of
 827         * {base, size}. The ranges[0] and ranges[1] are 32bit address space
 828         * while ranges[2] and ranges[3] are 64bit space.  We want to use 64bit
 829         * address ranges to support 64bit addressing. Because 'size' for
 830         * address ranges[2] and ranges[3] are same we can select either of
 831         * ranges[2] or ranges[3] for mapping. However due to 'size' is too
 832         * large for OS to allocate IOTSB we are using fix size 32G
 833         * (ATU_64_SPACE_SIZE) which is more than enough for all PCIe devices
 834         * to share.
 835         */
 836        atu->ranges = (struct atu_ranges *)ranges;
 837        atu->base = atu->ranges[3].base;
 838        atu->size = ATU_64_SPACE_SIZE;
 839
 840        /* Create IOTSB */
 841        err = pci_sun4v_atu_alloc_iotsb(pbm);
 842        if (err) {
 843                pr_err(PFX "Error creating ATU IOTSB\n");
 844                return err;
 845        }
 846
 847        /* Create ATU iommu map.
 848         * One bit represents one iotte in IOTSB table.
 849         */
 850        dma_mask = (roundup_pow_of_two(atu->size) - 1UL);
 851        num_iotte = atu->size / IO_PAGE_SIZE;
 852        map_size = num_iotte / 8;
 853        atu->tbl.table_map_base = atu->base;
 854        atu->dma_addr_mask = dma_mask;
 855        atu->tbl.map = kzalloc(map_size, GFP_KERNEL);
 856        if (!atu->tbl.map)
 857                return -ENOMEM;
 858
 859        iommu_tbl_pool_init(&atu->tbl, num_iotte, IO_PAGE_SHIFT,
 860                            NULL, false /* no large_pool */,
 861                            0 /* default npools */,
 862                            false /* want span boundary checking */);
 863
 864        return 0;
 865}
 866
 867static int pci_sun4v_iommu_init(struct pci_pbm_info *pbm)
 868{
 869        static const u32 vdma_default[] = { 0x80000000, 0x80000000 };
 870        struct iommu *iommu = pbm->iommu;
 871        unsigned long num_tsb_entries, sz;
 872        u32 dma_mask, dma_offset;
 873        const u32 *vdma;
 874
 875        vdma = of_get_property(pbm->op->dev.of_node, "virtual-dma", NULL);
 876        if (!vdma)
 877                vdma = vdma_default;
 878
 879        if ((vdma[0] | vdma[1]) & ~IO_PAGE_MASK) {
 880                printk(KERN_ERR PFX "Strange virtual-dma[%08x:%08x].\n",
 881                       vdma[0], vdma[1]);
 882                return -EINVAL;
 883        }
 884
 885        dma_mask = (roundup_pow_of_two(vdma[1]) - 1UL);
 886        num_tsb_entries = vdma[1] / IO_PAGE_SIZE;
 887
 888        dma_offset = vdma[0];
 889
 890        /* Setup initial software IOMMU state. */
 891        spin_lock_init(&iommu->lock);
 892        iommu->ctx_lowest_free = 1;
 893        iommu->tbl.table_map_base = dma_offset;
 894        iommu->dma_addr_mask = dma_mask;
 895
 896        /* Allocate and initialize the free area map.  */
 897        sz = (num_tsb_entries + 7) / 8;
 898        sz = (sz + 7UL) & ~7UL;
 899        iommu->tbl.map = kzalloc(sz, GFP_KERNEL);
 900        if (!iommu->tbl.map) {
 901                printk(KERN_ERR PFX "Error, kmalloc(arena.map) failed.\n");
 902                return -ENOMEM;
 903        }
 904        iommu_tbl_pool_init(&iommu->tbl, num_tsb_entries, IO_PAGE_SHIFT,
 905                            NULL, false /* no large_pool */,
 906                            0 /* default npools */,
 907                            false /* want span boundary checking */);
 908        sz = probe_existing_entries(pbm, &iommu->tbl);
 909        if (sz)
 910                printk("%s: Imported %lu TSB entries from OBP\n",
 911                       pbm->name, sz);
 912
 913        return 0;
 914}
 915
 916#ifdef CONFIG_PCI_MSI
 917struct pci_sun4v_msiq_entry {
 918        u64             version_type;
 919#define MSIQ_VERSION_MASK               0xffffffff00000000UL
 920#define MSIQ_VERSION_SHIFT              32
 921#define MSIQ_TYPE_MASK                  0x00000000000000ffUL
 922#define MSIQ_TYPE_SHIFT                 0
 923#define MSIQ_TYPE_NONE                  0x00
 924#define MSIQ_TYPE_MSG                   0x01
 925#define MSIQ_TYPE_MSI32                 0x02
 926#define MSIQ_TYPE_MSI64                 0x03
 927#define MSIQ_TYPE_INTX                  0x08
 928#define MSIQ_TYPE_NONE2                 0xff
 929
 930        u64             intx_sysino;
 931        u64             reserved1;
 932        u64             stick;
 933        u64             req_id;  /* bus/device/func */
 934#define MSIQ_REQID_BUS_MASK             0xff00UL
 935#define MSIQ_REQID_BUS_SHIFT            8
 936#define MSIQ_REQID_DEVICE_MASK          0x00f8UL
 937#define MSIQ_REQID_DEVICE_SHIFT         3
 938#define MSIQ_REQID_FUNC_MASK            0x0007UL
 939#define MSIQ_REQID_FUNC_SHIFT           0
 940
 941        u64             msi_address;
 942
 943        /* The format of this value is message type dependent.
 944         * For MSI bits 15:0 are the data from the MSI packet.
 945         * For MSI-X bits 31:0 are the data from the MSI packet.
 946         * For MSG, the message code and message routing code where:
 947         *      bits 39:32 is the bus/device/fn of the msg target-id
 948         *      bits 18:16 is the message routing code
 949         *      bits 7:0 is the message code
 950         * For INTx the low order 2-bits are:
 951         *      00 - INTA
 952         *      01 - INTB
 953         *      10 - INTC
 954         *      11 - INTD
 955         */
 956        u64             msi_data;
 957
 958        u64             reserved2;
 959};
 960
 961static int pci_sun4v_get_head(struct pci_pbm_info *pbm, unsigned long msiqid,
 962                              unsigned long *head)
 963{
 964        unsigned long err, limit;
 965
 966        err = pci_sun4v_msiq_gethead(pbm->devhandle, msiqid, head);
 967        if (unlikely(err))
 968                return -ENXIO;
 969
 970        limit = pbm->msiq_ent_count * sizeof(struct pci_sun4v_msiq_entry);
 971        if (unlikely(*head >= limit))
 972                return -EFBIG;
 973
 974        return 0;
 975}
 976
 977static int pci_sun4v_dequeue_msi(struct pci_pbm_info *pbm,
 978                                 unsigned long msiqid, unsigned long *head,
 979                                 unsigned long *msi)
 980{
 981        struct pci_sun4v_msiq_entry *ep;
 982        unsigned long err, type;
 983
 984        /* Note: void pointer arithmetic, 'head' is a byte offset  */
 985        ep = (pbm->msi_queues + ((msiqid - pbm->msiq_first) *
 986                                 (pbm->msiq_ent_count *
 987                                  sizeof(struct pci_sun4v_msiq_entry))) +
 988              *head);
 989
 990        if ((ep->version_type & MSIQ_TYPE_MASK) == 0)
 991                return 0;
 992
 993        type = (ep->version_type & MSIQ_TYPE_MASK) >> MSIQ_TYPE_SHIFT;
 994        if (unlikely(type != MSIQ_TYPE_MSI32 &&
 995                     type != MSIQ_TYPE_MSI64))
 996                return -EINVAL;
 997
 998        *msi = ep->msi_data;
 999
1000        err = pci_sun4v_msi_setstate(pbm->devhandle,
1001                                     ep->msi_data /* msi_num */,
1002                                     HV_MSISTATE_IDLE);
1003        if (unlikely(err))
1004                return -ENXIO;
1005
1006        /* Clear the entry.  */
1007        ep->version_type &= ~MSIQ_TYPE_MASK;
1008
1009        (*head) += sizeof(struct pci_sun4v_msiq_entry);
1010        if (*head >=
1011            (pbm->msiq_ent_count * sizeof(struct pci_sun4v_msiq_entry)))
1012                *head = 0;
1013
1014        return 1;
1015}
1016
1017static int pci_sun4v_set_head(struct pci_pbm_info *pbm, unsigned long msiqid,
1018                              unsigned long head)
1019{
1020        unsigned long err;
1021
1022        err = pci_sun4v_msiq_sethead(pbm->devhandle, msiqid, head);
1023        if (unlikely(err))
1024                return -EINVAL;
1025
1026        return 0;
1027}
1028
1029static int pci_sun4v_msi_setup(struct pci_pbm_info *pbm, unsigned long msiqid,
1030                               unsigned long msi, int is_msi64)
1031{
1032        if (pci_sun4v_msi_setmsiq(pbm->devhandle, msi, msiqid,
1033                                  (is_msi64 ?
1034                                   HV_MSITYPE_MSI64 : HV_MSITYPE_MSI32)))
1035                return -ENXIO;
1036        if (pci_sun4v_msi_setstate(pbm->devhandle, msi, HV_MSISTATE_IDLE))
1037                return -ENXIO;
1038        if (pci_sun4v_msi_setvalid(pbm->devhandle, msi, HV_MSIVALID_VALID))
1039                return -ENXIO;
1040        return 0;
1041}
1042
1043static int pci_sun4v_msi_teardown(struct pci_pbm_info *pbm, unsigned long msi)
1044{
1045        unsigned long err, msiqid;
1046
1047        err = pci_sun4v_msi_getmsiq(pbm->devhandle, msi, &msiqid);
1048        if (err)
1049                return -ENXIO;
1050
1051        pci_sun4v_msi_setvalid(pbm->devhandle, msi, HV_MSIVALID_INVALID);
1052
1053        return 0;
1054}
1055
1056static int pci_sun4v_msiq_alloc(struct pci_pbm_info *pbm)
1057{
1058        unsigned long q_size, alloc_size, pages, order;
1059        int i;
1060
1061        q_size = pbm->msiq_ent_count * sizeof(struct pci_sun4v_msiq_entry);
1062        alloc_size = (pbm->msiq_num * q_size);
1063        order = get_order(alloc_size);
1064        pages = __get_free_pages(GFP_KERNEL | __GFP_COMP, order);
1065        if (pages == 0UL) {
1066                printk(KERN_ERR "MSI: Cannot allocate MSI queues (o=%lu).\n",
1067                       order);
1068                return -ENOMEM;
1069        }
1070        memset((char *)pages, 0, PAGE_SIZE << order);
1071        pbm->msi_queues = (void *) pages;
1072
1073        for (i = 0; i < pbm->msiq_num; i++) {
1074                unsigned long err, base = __pa(pages + (i * q_size));
1075                unsigned long ret1, ret2;
1076
1077                err = pci_sun4v_msiq_conf(pbm->devhandle,
1078                                          pbm->msiq_first + i,
1079                                          base, pbm->msiq_ent_count);
1080                if (err) {
1081                        printk(KERN_ERR "MSI: msiq register fails (err=%lu)\n",
1082                               err);
1083                        goto h_error;
1084                }
1085
1086                err = pci_sun4v_msiq_info(pbm->devhandle,
1087                                          pbm->msiq_first + i,
1088                                          &ret1, &ret2);
1089                if (err) {
1090                        printk(KERN_ERR "MSI: Cannot read msiq (err=%lu)\n",
1091                               err);
1092                        goto h_error;
1093                }
1094                if (ret1 != base || ret2 != pbm->msiq_ent_count) {
1095                        printk(KERN_ERR "MSI: Bogus qconf "
1096                               "expected[%lx:%x] got[%lx:%lx]\n",
1097                               base, pbm->msiq_ent_count,
1098                               ret1, ret2);
1099                        goto h_error;
1100                }
1101        }
1102
1103        return 0;
1104
1105h_error:
1106        free_pages(pages, order);
1107        return -EINVAL;
1108}
1109
1110static void pci_sun4v_msiq_free(struct pci_pbm_info *pbm)
1111{
1112        unsigned long q_size, alloc_size, pages, order;
1113        int i;
1114
1115        for (i = 0; i < pbm->msiq_num; i++) {
1116                unsigned long msiqid = pbm->msiq_first + i;
1117
1118                (void) pci_sun4v_msiq_conf(pbm->devhandle, msiqid, 0UL, 0);
1119        }
1120
1121        q_size = pbm->msiq_ent_count * sizeof(struct pci_sun4v_msiq_entry);
1122        alloc_size = (pbm->msiq_num * q_size);
1123        order = get_order(alloc_size);
1124
1125        pages = (unsigned long) pbm->msi_queues;
1126
1127        free_pages(pages, order);
1128
1129        pbm->msi_queues = NULL;
1130}
1131
1132static int pci_sun4v_msiq_build_irq(struct pci_pbm_info *pbm,
1133                                    unsigned long msiqid,
1134                                    unsigned long devino)
1135{
1136        unsigned int irq = sun4v_build_irq(pbm->devhandle, devino);
1137
1138        if (!irq)
1139                return -ENOMEM;
1140
1141        if (pci_sun4v_msiq_setvalid(pbm->devhandle, msiqid, HV_MSIQ_VALID))
1142                return -EINVAL;
1143        if (pci_sun4v_msiq_setstate(pbm->devhandle, msiqid, HV_MSIQSTATE_IDLE))
1144                return -EINVAL;
1145
1146        return irq;
1147}
1148
1149static const struct sparc64_msiq_ops pci_sun4v_msiq_ops = {
1150        .get_head       =       pci_sun4v_get_head,
1151        .dequeue_msi    =       pci_sun4v_dequeue_msi,
1152        .set_head       =       pci_sun4v_set_head,
1153        .msi_setup      =       pci_sun4v_msi_setup,
1154        .msi_teardown   =       pci_sun4v_msi_teardown,
1155        .msiq_alloc     =       pci_sun4v_msiq_alloc,
1156        .msiq_free      =       pci_sun4v_msiq_free,
1157        .msiq_build_irq =       pci_sun4v_msiq_build_irq,
1158};
1159
1160static void pci_sun4v_msi_init(struct pci_pbm_info *pbm)
1161{
1162        sparc64_pbm_msi_init(pbm, &pci_sun4v_msiq_ops);
1163}
1164#else /* CONFIG_PCI_MSI */
1165static void pci_sun4v_msi_init(struct pci_pbm_info *pbm)
1166{
1167}
1168#endif /* !(CONFIG_PCI_MSI) */
1169
1170static int pci_sun4v_pbm_init(struct pci_pbm_info *pbm,
1171                              struct platform_device *op, u32 devhandle)
1172{
1173        struct device_node *dp = op->dev.of_node;
1174        int err;
1175
1176        pbm->numa_node = of_node_to_nid(dp);
1177
1178        pbm->pci_ops = &sun4v_pci_ops;
1179        pbm->config_space_reg_bits = 12;
1180
1181        pbm->index = pci_num_pbms++;
1182
1183        pbm->op = op;
1184
1185        pbm->devhandle = devhandle;
1186
1187        pbm->name = dp->full_name;
1188
1189        printk("%s: SUN4V PCI Bus Module\n", pbm->name);
1190        printk("%s: On NUMA node %d\n", pbm->name, pbm->numa_node);
1191
1192        pci_determine_mem_io_space(pbm);
1193
1194        pci_get_pbm_props(pbm);
1195
1196        err = pci_sun4v_iommu_init(pbm);
1197        if (err)
1198                return err;
1199
1200        pci_sun4v_msi_init(pbm);
1201
1202        pci_sun4v_scan_bus(pbm, &op->dev);
1203
1204        /* if atu_init fails its not complete failure.
1205         * we can still continue using legacy iommu.
1206         */
1207        if (pbm->iommu->atu) {
1208                err = pci_sun4v_atu_init(pbm);
1209                if (err) {
1210                        kfree(pbm->iommu->atu);
1211                        pbm->iommu->atu = NULL;
1212                        pr_err(PFX "ATU init failed, err=%d\n", err);
1213                }
1214        }
1215
1216        pbm->next = pci_pbm_root;
1217        pci_pbm_root = pbm;
1218
1219        return 0;
1220}
1221
1222static int pci_sun4v_probe(struct platform_device *op)
1223{
1224        const struct linux_prom64_registers *regs;
1225        static int hvapi_negotiated = 0;
1226        struct pci_pbm_info *pbm;
1227        struct device_node *dp;
1228        struct iommu *iommu;
1229        struct atu *atu;
1230        u32 devhandle;
1231        int i, err = -ENODEV;
1232        static bool hv_atu = true;
1233
1234        dp = op->dev.of_node;
1235
1236        if (!hvapi_negotiated++) {
1237                for (i = 0; i < ARRAY_SIZE(vpci_versions); i++) {
1238                        vpci_major = vpci_versions[i].major;
1239                        vpci_minor = vpci_versions[i].minor;
1240
1241                        err = sun4v_hvapi_register(HV_GRP_PCI, vpci_major,
1242                                                   &vpci_minor);
1243                        if (!err)
1244                                break;
1245                }
1246
1247                if (err) {
1248                        pr_err(PFX "Could not register hvapi, err=%d\n", err);
1249                        return err;
1250                }
1251                pr_info(PFX "Registered hvapi major[%lu] minor[%lu]\n",
1252                        vpci_major, vpci_minor);
1253
1254                err = sun4v_hvapi_register(HV_GRP_ATU, vatu_major, &vatu_minor);
1255                if (err) {
1256                        /* don't return an error if we fail to register the
1257                         * ATU group, but ATU hcalls won't be available.
1258                         */
1259                        hv_atu = false;
1260                } else {
1261                        pr_info(PFX "Registered hvapi ATU major[%lu] minor[%lu]\n",
1262                                vatu_major, vatu_minor);
1263                }
1264
1265                dma_ops = &sun4v_dma_ops;
1266        }
1267
1268        regs = of_get_property(dp, "reg", NULL);
1269        err = -ENODEV;
1270        if (!regs) {
1271                printk(KERN_ERR PFX "Could not find config registers\n");
1272                goto out_err;
1273        }
1274        devhandle = (regs->phys_addr >> 32UL) & 0x0fffffff;
1275
1276        err = -ENOMEM;
1277        if (!iommu_batch_initialized) {
1278                for_each_possible_cpu(i) {
1279                        unsigned long page = get_zeroed_page(GFP_KERNEL);
1280
1281                        if (!page)
1282                                goto out_err;
1283
1284                        per_cpu(iommu_batch, i).pglist = (u64 *) page;
1285                }
1286                iommu_batch_initialized = 1;
1287        }
1288
1289        pbm = kzalloc(sizeof(*pbm), GFP_KERNEL);
1290        if (!pbm) {
1291                printk(KERN_ERR PFX "Could not allocate pci_pbm_info\n");
1292                goto out_err;
1293        }
1294
1295        iommu = kzalloc(sizeof(struct iommu), GFP_KERNEL);
1296        if (!iommu) {
1297                printk(KERN_ERR PFX "Could not allocate pbm iommu\n");
1298                goto out_free_controller;
1299        }
1300
1301        pbm->iommu = iommu;
1302        iommu->atu = NULL;
1303        if (hv_atu) {
1304                atu = kzalloc(sizeof(*atu), GFP_KERNEL);
1305                if (!atu)
1306                        pr_err(PFX "Could not allocate atu\n");
1307                else
1308                        iommu->atu = atu;
1309        }
1310
1311        err = pci_sun4v_pbm_init(pbm, op, devhandle);
1312        if (err)
1313                goto out_free_iommu;
1314
1315        dev_set_drvdata(&op->dev, pbm);
1316
1317        return 0;
1318
1319out_free_iommu:
1320        kfree(iommu->atu);
1321        kfree(pbm->iommu);
1322
1323out_free_controller:
1324        kfree(pbm);
1325
1326out_err:
1327        return err;
1328}
1329
1330static const struct of_device_id pci_sun4v_match[] = {
1331        {
1332                .name = "pci",
1333                .compatible = "SUNW,sun4v-pci",
1334        },
1335        {},
1336};
1337
1338static struct platform_driver pci_sun4v_driver = {
1339        .driver = {
1340                .name = DRIVER_NAME,
1341                .of_match_table = pci_sun4v_match,
1342        },
1343        .probe          = pci_sun4v_probe,
1344};
1345
1346static int __init pci_sun4v_init(void)
1347{
1348        return platform_driver_register(&pci_sun4v_driver);
1349}
1350
1351subsys_initcall(pci_sun4v_init);
1352