linux/drivers/net/ethernet/ibm/ibmveth.c
<<
>>
Prefs
   1/*
   2 * IBM Power Virtual Ethernet Device Driver
   3 *
   4 * This program is free software; you can redistribute it and/or modify
   5 * it under the terms of the GNU General Public License as published by
   6 * the Free Software Foundation; either version 2 of the License, or
   7 * (at your option) any later version.
   8 *
   9 * This program is distributed in the hope that it will be useful,
  10 * but WITHOUT ANY WARRANTY; without even the implied warranty of
  11 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
  12 * GNU General Public License for more details.
  13 *
  14 * You should have received a copy of the GNU General Public License
  15 * along with this program; if not, write to the Free Software
  16 * Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA.
  17 *
  18 * Copyright (C) IBM Corporation, 2003, 2010
  19 *
  20 * Authors: Dave Larson <larson1@us.ibm.com>
  21 *          Santiago Leon <santil@linux.vnet.ibm.com>
  22 *          Brian King <brking@linux.vnet.ibm.com>
  23 *          Robert Jennings <rcj@linux.vnet.ibm.com>
  24 *          Anton Blanchard <anton@au.ibm.com>
  25 */
  26
  27#include <linux/module.h>
  28#include <linux/moduleparam.h>
  29#include <linux/types.h>
  30#include <linux/errno.h>
  31#include <linux/dma-mapping.h>
  32#include <linux/kernel.h>
  33#include <linux/netdevice.h>
  34#include <linux/etherdevice.h>
  35#include <linux/skbuff.h>
  36#include <linux/init.h>
  37#include <linux/interrupt.h>
  38#include <linux/mm.h>
  39#include <linux/pm.h>
  40#include <linux/ethtool.h>
  41#include <linux/in.h>
  42#include <linux/ip.h>
  43#include <linux/ipv6.h>
  44#include <linux/slab.h>
  45#include <asm/hvcall.h>
  46#include <linux/atomic.h>
  47#include <asm/vio.h>
  48#include <asm/iommu.h>
  49#include <asm/firmware.h>
  50
  51#include "ibmveth.h"
  52
  53static irqreturn_t ibmveth_interrupt(int irq, void *dev_instance);
  54static void ibmveth_rxq_harvest_buffer(struct ibmveth_adapter *adapter);
  55static unsigned long ibmveth_get_desired_dma(struct vio_dev *vdev);
  56
  57static struct kobj_type ktype_veth_pool;
  58
  59
  60static const char ibmveth_driver_name[] = "ibmveth";
  61static const char ibmveth_driver_string[] = "IBM Power Virtual Ethernet Driver";
  62#define ibmveth_driver_version "1.04"
  63
  64MODULE_AUTHOR("Santiago Leon <santil@linux.vnet.ibm.com>");
  65MODULE_DESCRIPTION("IBM Power Virtual Ethernet Driver");
  66MODULE_LICENSE("GPL");
  67MODULE_VERSION(ibmveth_driver_version);
  68
  69static unsigned int tx_copybreak __read_mostly = 128;
  70module_param(tx_copybreak, uint, 0644);
  71MODULE_PARM_DESC(tx_copybreak,
  72        "Maximum size of packet that is copied to a new buffer on transmit");
  73
  74static unsigned int rx_copybreak __read_mostly = 128;
  75module_param(rx_copybreak, uint, 0644);
  76MODULE_PARM_DESC(rx_copybreak,
  77        "Maximum size of packet that is copied to a new buffer on receive");
  78
  79static unsigned int rx_flush __read_mostly = 0;
  80module_param(rx_flush, uint, 0644);
  81MODULE_PARM_DESC(rx_flush, "Flush receive buffers before use");
  82
  83struct ibmveth_stat {
  84        char name[ETH_GSTRING_LEN];
  85        int offset;
  86};
  87
  88#define IBMVETH_STAT_OFF(stat) offsetof(struct ibmveth_adapter, stat)
  89#define IBMVETH_GET_STAT(a, off) *((u64 *)(((unsigned long)(a)) + off))
  90
  91struct ibmveth_stat ibmveth_stats[] = {
  92        { "replenish_task_cycles", IBMVETH_STAT_OFF(replenish_task_cycles) },
  93        { "replenish_no_mem", IBMVETH_STAT_OFF(replenish_no_mem) },
  94        { "replenish_add_buff_failure",
  95                        IBMVETH_STAT_OFF(replenish_add_buff_failure) },
  96        { "replenish_add_buff_success",
  97                        IBMVETH_STAT_OFF(replenish_add_buff_success) },
  98        { "rx_invalid_buffer", IBMVETH_STAT_OFF(rx_invalid_buffer) },
  99        { "rx_no_buffer", IBMVETH_STAT_OFF(rx_no_buffer) },
 100        { "tx_map_failed", IBMVETH_STAT_OFF(tx_map_failed) },
 101        { "tx_send_failed", IBMVETH_STAT_OFF(tx_send_failed) },
 102        { "fw_enabled_ipv4_csum", IBMVETH_STAT_OFF(fw_ipv4_csum_support) },
 103        { "fw_enabled_ipv6_csum", IBMVETH_STAT_OFF(fw_ipv6_csum_support) },
 104};
 105
 106/* simple methods of getting data from the current rxq entry */
 107static inline u32 ibmveth_rxq_flags(struct ibmveth_adapter *adapter)
 108{
 109        return adapter->rx_queue.queue_addr[adapter->rx_queue.index].flags_off;
 110}
 111
 112static inline int ibmveth_rxq_toggle(struct ibmveth_adapter *adapter)
 113{
 114        return (ibmveth_rxq_flags(adapter) & IBMVETH_RXQ_TOGGLE) >>
 115                        IBMVETH_RXQ_TOGGLE_SHIFT;
 116}
 117
 118static inline int ibmveth_rxq_pending_buffer(struct ibmveth_adapter *adapter)
 119{
 120        return ibmveth_rxq_toggle(adapter) == adapter->rx_queue.toggle;
 121}
 122
 123static inline int ibmveth_rxq_buffer_valid(struct ibmveth_adapter *adapter)
 124{
 125        return ibmveth_rxq_flags(adapter) & IBMVETH_RXQ_VALID;
 126}
 127
 128static inline int ibmveth_rxq_frame_offset(struct ibmveth_adapter *adapter)
 129{
 130        return ibmveth_rxq_flags(adapter) & IBMVETH_RXQ_OFF_MASK;
 131}
 132
 133static inline int ibmveth_rxq_frame_length(struct ibmveth_adapter *adapter)
 134{
 135        return adapter->rx_queue.queue_addr[adapter->rx_queue.index].length;
 136}
 137
 138static inline int ibmveth_rxq_csum_good(struct ibmveth_adapter *adapter)
 139{
 140        return ibmveth_rxq_flags(adapter) & IBMVETH_RXQ_CSUM_GOOD;
 141}
 142
 143/* setup the initial settings for a buffer pool */
 144static void ibmveth_init_buffer_pool(struct ibmveth_buff_pool *pool,
 145                                     u32 pool_index, u32 pool_size,
 146                                     u32 buff_size, u32 pool_active)
 147{
 148        pool->size = pool_size;
 149        pool->index = pool_index;
 150        pool->buff_size = buff_size;
 151        pool->threshold = pool_size * 7 / 8;
 152        pool->active = pool_active;
 153}
 154
 155/* allocate and setup an buffer pool - called during open */
 156static int ibmveth_alloc_buffer_pool(struct ibmveth_buff_pool *pool)
 157{
 158        int i;
 159
 160        pool->free_map = kmalloc(sizeof(u16) * pool->size, GFP_KERNEL);
 161
 162        if (!pool->free_map)
 163                return -1;
 164
 165        pool->dma_addr = kmalloc(sizeof(dma_addr_t) * pool->size, GFP_KERNEL);
 166        if (!pool->dma_addr) {
 167                kfree(pool->free_map);
 168                pool->free_map = NULL;
 169                return -1;
 170        }
 171
 172        pool->skbuff = kcalloc(pool->size, sizeof(void *), GFP_KERNEL);
 173
 174        if (!pool->skbuff) {
 175                kfree(pool->dma_addr);
 176                pool->dma_addr = NULL;
 177
 178                kfree(pool->free_map);
 179                pool->free_map = NULL;
 180                return -1;
 181        }
 182
 183        memset(pool->dma_addr, 0, sizeof(dma_addr_t) * pool->size);
 184
 185        for (i = 0; i < pool->size; ++i)
 186                pool->free_map[i] = i;
 187
 188        atomic_set(&pool->available, 0);
 189        pool->producer_index = 0;
 190        pool->consumer_index = 0;
 191
 192        return 0;
 193}
 194
 195static inline void ibmveth_flush_buffer(void *addr, unsigned long length)
 196{
 197        unsigned long offset;
 198
 199        for (offset = 0; offset < length; offset += SMP_CACHE_BYTES)
 200                asm("dcbfl %0,%1" :: "b" (addr), "r" (offset));
 201}
 202
 203/* replenish the buffers for a pool.  note that we don't need to
 204 * skb_reserve these since they are used for incoming...
 205 */
 206static void ibmveth_replenish_buffer_pool(struct ibmveth_adapter *adapter,
 207                                          struct ibmveth_buff_pool *pool)
 208{
 209        u32 i;
 210        u32 count = pool->size - atomic_read(&pool->available);
 211        u32 buffers_added = 0;
 212        struct sk_buff *skb;
 213        unsigned int free_index, index;
 214        u64 correlator;
 215        unsigned long lpar_rc;
 216        dma_addr_t dma_addr;
 217
 218        mb();
 219
 220        for (i = 0; i < count; ++i) {
 221                union ibmveth_buf_desc desc;
 222
 223                skb = netdev_alloc_skb(adapter->netdev, pool->buff_size);
 224
 225                if (!skb) {
 226                        netdev_dbg(adapter->netdev,
 227                                   "replenish: unable to allocate skb\n");
 228                        adapter->replenish_no_mem++;
 229                        break;
 230                }
 231
 232                free_index = pool->consumer_index;
 233                pool->consumer_index++;
 234                if (pool->consumer_index >= pool->size)
 235                        pool->consumer_index = 0;
 236                index = pool->free_map[free_index];
 237
 238                BUG_ON(index == IBM_VETH_INVALID_MAP);
 239                BUG_ON(pool->skbuff[index] != NULL);
 240
 241                dma_addr = dma_map_single(&adapter->vdev->dev, skb->data,
 242                                pool->buff_size, DMA_FROM_DEVICE);
 243
 244                if (dma_mapping_error(&adapter->vdev->dev, dma_addr))
 245                        goto failure;
 246
 247                pool->free_map[free_index] = IBM_VETH_INVALID_MAP;
 248                pool->dma_addr[index] = dma_addr;
 249                pool->skbuff[index] = skb;
 250
 251                correlator = ((u64)pool->index << 32) | index;
 252                *(u64 *)skb->data = correlator;
 253
 254                desc.fields.flags_len = IBMVETH_BUF_VALID | pool->buff_size;
 255                desc.fields.address = dma_addr;
 256
 257                if (rx_flush) {
 258                        unsigned int len = min(pool->buff_size,
 259                                                adapter->netdev->mtu +
 260                                                IBMVETH_BUFF_OH);
 261                        ibmveth_flush_buffer(skb->data, len);
 262                }
 263                lpar_rc = h_add_logical_lan_buffer(adapter->vdev->unit_address,
 264                                                   desc.desc);
 265
 266                if (lpar_rc != H_SUCCESS) {
 267                        goto failure;
 268                } else {
 269                        buffers_added++;
 270                        adapter->replenish_add_buff_success++;
 271                }
 272        }
 273
 274        mb();
 275        atomic_add(buffers_added, &(pool->available));
 276        return;
 277
 278failure:
 279        pool->free_map[free_index] = index;
 280        pool->skbuff[index] = NULL;
 281        if (pool->consumer_index == 0)
 282                pool->consumer_index = pool->size - 1;
 283        else
 284                pool->consumer_index--;
 285        if (!dma_mapping_error(&adapter->vdev->dev, dma_addr))
 286                dma_unmap_single(&adapter->vdev->dev,
 287                                 pool->dma_addr[index], pool->buff_size,
 288                                 DMA_FROM_DEVICE);
 289        dev_kfree_skb_any(skb);
 290        adapter->replenish_add_buff_failure++;
 291
 292        mb();
 293        atomic_add(buffers_added, &(pool->available));
 294}
 295
 296/* replenish routine */
 297static void ibmveth_replenish_task(struct ibmveth_adapter *adapter)
 298{
 299        int i;
 300
 301        adapter->replenish_task_cycles++;
 302
 303        for (i = (IBMVETH_NUM_BUFF_POOLS - 1); i >= 0; i--) {
 304                struct ibmveth_buff_pool *pool = &adapter->rx_buff_pool[i];
 305
 306                if (pool->active &&
 307                    (atomic_read(&pool->available) < pool->threshold))
 308                        ibmveth_replenish_buffer_pool(adapter, pool);
 309        }
 310
 311        adapter->rx_no_buffer = *(u64 *)(((char*)adapter->buffer_list_addr) +
 312                                                4096 - 8);
 313}
 314
 315/* empty and free ana buffer pool - also used to do cleanup in error paths */
 316static void ibmveth_free_buffer_pool(struct ibmveth_adapter *adapter,
 317                                     struct ibmveth_buff_pool *pool)
 318{
 319        int i;
 320
 321        kfree(pool->free_map);
 322        pool->free_map = NULL;
 323
 324        if (pool->skbuff && pool->dma_addr) {
 325                for (i = 0; i < pool->size; ++i) {
 326                        struct sk_buff *skb = pool->skbuff[i];
 327                        if (skb) {
 328                                dma_unmap_single(&adapter->vdev->dev,
 329                                                 pool->dma_addr[i],
 330                                                 pool->buff_size,
 331                                                 DMA_FROM_DEVICE);
 332                                dev_kfree_skb_any(skb);
 333                                pool->skbuff[i] = NULL;
 334                        }
 335                }
 336        }
 337
 338        if (pool->dma_addr) {
 339                kfree(pool->dma_addr);
 340                pool->dma_addr = NULL;
 341        }
 342
 343        if (pool->skbuff) {
 344                kfree(pool->skbuff);
 345                pool->skbuff = NULL;
 346        }
 347}
 348
 349/* remove a buffer from a pool */
 350static void ibmveth_remove_buffer_from_pool(struct ibmveth_adapter *adapter,
 351                                            u64 correlator)
 352{
 353        unsigned int pool  = correlator >> 32;
 354        unsigned int index = correlator & 0xffffffffUL;
 355        unsigned int free_index;
 356        struct sk_buff *skb;
 357
 358        BUG_ON(pool >= IBMVETH_NUM_BUFF_POOLS);
 359        BUG_ON(index >= adapter->rx_buff_pool[pool].size);
 360
 361        skb = adapter->rx_buff_pool[pool].skbuff[index];
 362
 363        BUG_ON(skb == NULL);
 364
 365        adapter->rx_buff_pool[pool].skbuff[index] = NULL;
 366
 367        dma_unmap_single(&adapter->vdev->dev,
 368                         adapter->rx_buff_pool[pool].dma_addr[index],
 369                         adapter->rx_buff_pool[pool].buff_size,
 370                         DMA_FROM_DEVICE);
 371
 372        free_index = adapter->rx_buff_pool[pool].producer_index;
 373        adapter->rx_buff_pool[pool].producer_index++;
 374        if (adapter->rx_buff_pool[pool].producer_index >=
 375            adapter->rx_buff_pool[pool].size)
 376                adapter->rx_buff_pool[pool].producer_index = 0;
 377        adapter->rx_buff_pool[pool].free_map[free_index] = index;
 378
 379        mb();
 380
 381        atomic_dec(&(adapter->rx_buff_pool[pool].available));
 382}
 383
 384/* get the current buffer on the rx queue */
 385static inline struct sk_buff *ibmveth_rxq_get_buffer(struct ibmveth_adapter *adapter)
 386{
 387        u64 correlator = adapter->rx_queue.queue_addr[adapter->rx_queue.index].correlator;
 388        unsigned int pool = correlator >> 32;
 389        unsigned int index = correlator & 0xffffffffUL;
 390
 391        BUG_ON(pool >= IBMVETH_NUM_BUFF_POOLS);
 392        BUG_ON(index >= adapter->rx_buff_pool[pool].size);
 393
 394        return adapter->rx_buff_pool[pool].skbuff[index];
 395}
 396
 397/* recycle the current buffer on the rx queue */
 398static int ibmveth_rxq_recycle_buffer(struct ibmveth_adapter *adapter)
 399{
 400        u32 q_index = adapter->rx_queue.index;
 401        u64 correlator = adapter->rx_queue.queue_addr[q_index].correlator;
 402        unsigned int pool = correlator >> 32;
 403        unsigned int index = correlator & 0xffffffffUL;
 404        union ibmveth_buf_desc desc;
 405        unsigned long lpar_rc;
 406        int ret = 1;
 407
 408        BUG_ON(pool >= IBMVETH_NUM_BUFF_POOLS);
 409        BUG_ON(index >= adapter->rx_buff_pool[pool].size);
 410
 411        if (!adapter->rx_buff_pool[pool].active) {
 412                ibmveth_rxq_harvest_buffer(adapter);
 413                ibmveth_free_buffer_pool(adapter, &adapter->rx_buff_pool[pool]);
 414                goto out;
 415        }
 416
 417        desc.fields.flags_len = IBMVETH_BUF_VALID |
 418                adapter->rx_buff_pool[pool].buff_size;
 419        desc.fields.address = adapter->rx_buff_pool[pool].dma_addr[index];
 420
 421        lpar_rc = h_add_logical_lan_buffer(adapter->vdev->unit_address, desc.desc);
 422
 423        if (lpar_rc != H_SUCCESS) {
 424                netdev_dbg(adapter->netdev, "h_add_logical_lan_buffer failed "
 425                           "during recycle rc=%ld", lpar_rc);
 426                ibmveth_remove_buffer_from_pool(adapter, adapter->rx_queue.queue_addr[adapter->rx_queue.index].correlator);
 427                ret = 0;
 428        }
 429
 430        if (++adapter->rx_queue.index == adapter->rx_queue.num_slots) {
 431                adapter->rx_queue.index = 0;
 432                adapter->rx_queue.toggle = !adapter->rx_queue.toggle;
 433        }
 434
 435out:
 436        return ret;
 437}
 438
 439static void ibmveth_rxq_harvest_buffer(struct ibmveth_adapter *adapter)
 440{
 441        ibmveth_remove_buffer_from_pool(adapter, adapter->rx_queue.queue_addr[adapter->rx_queue.index].correlator);
 442
 443        if (++adapter->rx_queue.index == adapter->rx_queue.num_slots) {
 444                adapter->rx_queue.index = 0;
 445                adapter->rx_queue.toggle = !adapter->rx_queue.toggle;
 446        }
 447}
 448
 449static void ibmveth_cleanup(struct ibmveth_adapter *adapter)
 450{
 451        int i;
 452        struct device *dev = &adapter->vdev->dev;
 453
 454        if (adapter->buffer_list_addr != NULL) {
 455                if (!dma_mapping_error(dev, adapter->buffer_list_dma)) {
 456                        dma_unmap_single(dev, adapter->buffer_list_dma, 4096,
 457                                        DMA_BIDIRECTIONAL);
 458                        adapter->buffer_list_dma = DMA_ERROR_CODE;
 459                }
 460                free_page((unsigned long)adapter->buffer_list_addr);
 461                adapter->buffer_list_addr = NULL;
 462        }
 463
 464        if (adapter->filter_list_addr != NULL) {
 465                if (!dma_mapping_error(dev, adapter->filter_list_dma)) {
 466                        dma_unmap_single(dev, adapter->filter_list_dma, 4096,
 467                                        DMA_BIDIRECTIONAL);
 468                        adapter->filter_list_dma = DMA_ERROR_CODE;
 469                }
 470                free_page((unsigned long)adapter->filter_list_addr);
 471                adapter->filter_list_addr = NULL;
 472        }
 473
 474        if (adapter->rx_queue.queue_addr != NULL) {
 475                dma_free_coherent(dev, adapter->rx_queue.queue_len,
 476                                  adapter->rx_queue.queue_addr,
 477                                  adapter->rx_queue.queue_dma);
 478                adapter->rx_queue.queue_addr = NULL;
 479        }
 480
 481        for (i = 0; i < IBMVETH_NUM_BUFF_POOLS; i++)
 482                if (adapter->rx_buff_pool[i].active)
 483                        ibmveth_free_buffer_pool(adapter,
 484                                                 &adapter->rx_buff_pool[i]);
 485
 486        if (adapter->bounce_buffer != NULL) {
 487                if (!dma_mapping_error(dev, adapter->bounce_buffer_dma)) {
 488                        dma_unmap_single(&adapter->vdev->dev,
 489                                        adapter->bounce_buffer_dma,
 490                                        adapter->netdev->mtu + IBMVETH_BUFF_OH,
 491                                        DMA_BIDIRECTIONAL);
 492                        adapter->bounce_buffer_dma = DMA_ERROR_CODE;
 493                }
 494                kfree(adapter->bounce_buffer);
 495                adapter->bounce_buffer = NULL;
 496        }
 497}
 498
 499static int ibmveth_register_logical_lan(struct ibmveth_adapter *adapter,
 500        union ibmveth_buf_desc rxq_desc, u64 mac_address)
 501{
 502        int rc, try_again = 1;
 503
 504        /*
 505         * After a kexec the adapter will still be open, so our attempt to
 506         * open it will fail. So if we get a failure we free the adapter and
 507         * try again, but only once.
 508         */
 509retry:
 510        rc = h_register_logical_lan(adapter->vdev->unit_address,
 511                                    adapter->buffer_list_dma, rxq_desc.desc,
 512                                    adapter->filter_list_dma, mac_address);
 513
 514        if (rc != H_SUCCESS && try_again) {
 515                do {
 516                        rc = h_free_logical_lan(adapter->vdev->unit_address);
 517                } while (H_IS_LONG_BUSY(rc) || (rc == H_BUSY));
 518
 519                try_again = 0;
 520                goto retry;
 521        }
 522
 523        return rc;
 524}
 525
 526static int ibmveth_open(struct net_device *netdev)
 527{
 528        struct ibmveth_adapter *adapter = netdev_priv(netdev);
 529        u64 mac_address = 0;
 530        int rxq_entries = 1;
 531        unsigned long lpar_rc;
 532        int rc;
 533        union ibmveth_buf_desc rxq_desc;
 534        int i;
 535        struct device *dev;
 536
 537        netdev_dbg(netdev, "open starting\n");
 538
 539        napi_enable(&adapter->napi);
 540
 541        for(i = 0; i < IBMVETH_NUM_BUFF_POOLS; i++)
 542                rxq_entries += adapter->rx_buff_pool[i].size;
 543
 544        adapter->buffer_list_addr = (void*) get_zeroed_page(GFP_KERNEL);
 545        adapter->filter_list_addr = (void*) get_zeroed_page(GFP_KERNEL);
 546
 547        if (!adapter->buffer_list_addr || !adapter->filter_list_addr) {
 548                netdev_err(netdev, "unable to allocate filter or buffer list "
 549                           "pages\n");
 550                rc = -ENOMEM;
 551                goto err_out;
 552        }
 553
 554        dev = &adapter->vdev->dev;
 555
 556        adapter->rx_queue.queue_len = sizeof(struct ibmveth_rx_q_entry) *
 557                                                rxq_entries;
 558        adapter->rx_queue.queue_addr =
 559                dma_alloc_coherent(dev, adapter->rx_queue.queue_len,
 560                                   &adapter->rx_queue.queue_dma, GFP_KERNEL);
 561        if (!adapter->rx_queue.queue_addr) {
 562                rc = -ENOMEM;
 563                goto err_out;
 564        }
 565
 566        adapter->buffer_list_dma = dma_map_single(dev,
 567                        adapter->buffer_list_addr, 4096, DMA_BIDIRECTIONAL);
 568        adapter->filter_list_dma = dma_map_single(dev,
 569                        adapter->filter_list_addr, 4096, DMA_BIDIRECTIONAL);
 570
 571        if ((dma_mapping_error(dev, adapter->buffer_list_dma)) ||
 572            (dma_mapping_error(dev, adapter->filter_list_dma))) {
 573                netdev_err(netdev, "unable to map filter or buffer list "
 574                           "pages\n");
 575                rc = -ENOMEM;
 576                goto err_out;
 577        }
 578
 579        adapter->rx_queue.index = 0;
 580        adapter->rx_queue.num_slots = rxq_entries;
 581        adapter->rx_queue.toggle = 1;
 582
 583        memcpy(&mac_address, netdev->dev_addr, netdev->addr_len);
 584        mac_address = mac_address >> 16;
 585
 586        rxq_desc.fields.flags_len = IBMVETH_BUF_VALID |
 587                                        adapter->rx_queue.queue_len;
 588        rxq_desc.fields.address = adapter->rx_queue.queue_dma;
 589
 590        netdev_dbg(netdev, "buffer list @ 0x%p\n", adapter->buffer_list_addr);
 591        netdev_dbg(netdev, "filter list @ 0x%p\n", adapter->filter_list_addr);
 592        netdev_dbg(netdev, "receive q   @ 0x%p\n", adapter->rx_queue.queue_addr);
 593
 594        h_vio_signal(adapter->vdev->unit_address, VIO_IRQ_DISABLE);
 595
 596        lpar_rc = ibmveth_register_logical_lan(adapter, rxq_desc, mac_address);
 597
 598        if (lpar_rc != H_SUCCESS) {
 599                netdev_err(netdev, "h_register_logical_lan failed with %ld\n",
 600                           lpar_rc);
 601                netdev_err(netdev, "buffer TCE:0x%llx filter TCE:0x%llx rxq "
 602                           "desc:0x%llx MAC:0x%llx\n",
 603                                     adapter->buffer_list_dma,
 604                                     adapter->filter_list_dma,
 605                                     rxq_desc.desc,
 606                                     mac_address);
 607                rc = -ENONET;
 608                goto err_out;
 609        }
 610
 611        for (i = 0; i < IBMVETH_NUM_BUFF_POOLS; i++) {
 612                if (!adapter->rx_buff_pool[i].active)
 613                        continue;
 614                if (ibmveth_alloc_buffer_pool(&adapter->rx_buff_pool[i])) {
 615                        netdev_err(netdev, "unable to alloc pool\n");
 616                        adapter->rx_buff_pool[i].active = 0;
 617                        rc = -ENOMEM;
 618                        goto err_out;
 619                }
 620        }
 621
 622        netdev_dbg(netdev, "registering irq 0x%x\n", netdev->irq);
 623        rc = request_irq(netdev->irq, ibmveth_interrupt, 0, netdev->name,
 624                         netdev);
 625        if (rc != 0) {
 626                netdev_err(netdev, "unable to request irq 0x%x, rc %d\n",
 627                           netdev->irq, rc);
 628                do {
 629                        lpar_rc = h_free_logical_lan(adapter->vdev->unit_address);
 630                } while (H_IS_LONG_BUSY(lpar_rc) || (lpar_rc == H_BUSY));
 631
 632                goto err_out;
 633        }
 634
 635        adapter->bounce_buffer =
 636            kmalloc(netdev->mtu + IBMVETH_BUFF_OH, GFP_KERNEL);
 637        if (!adapter->bounce_buffer) {
 638                rc = -ENOMEM;
 639                goto err_out_free_irq;
 640        }
 641        adapter->bounce_buffer_dma =
 642            dma_map_single(&adapter->vdev->dev, adapter->bounce_buffer,
 643                           netdev->mtu + IBMVETH_BUFF_OH, DMA_BIDIRECTIONAL);
 644        if (dma_mapping_error(dev, adapter->bounce_buffer_dma)) {
 645                netdev_err(netdev, "unable to map bounce buffer\n");
 646                rc = -ENOMEM;
 647                goto err_out_free_irq;
 648        }
 649
 650        netdev_dbg(netdev, "initial replenish cycle\n");
 651        ibmveth_interrupt(netdev->irq, netdev);
 652
 653        netif_start_queue(netdev);
 654
 655        netdev_dbg(netdev, "open complete\n");
 656
 657        return 0;
 658
 659err_out_free_irq:
 660        free_irq(netdev->irq, netdev);
 661err_out:
 662        ibmveth_cleanup(adapter);
 663        napi_disable(&adapter->napi);
 664        return rc;
 665}
 666
 667static int ibmveth_close(struct net_device *netdev)
 668{
 669        struct ibmveth_adapter *adapter = netdev_priv(netdev);
 670        long lpar_rc;
 671
 672        netdev_dbg(netdev, "close starting\n");
 673
 674        napi_disable(&adapter->napi);
 675
 676        if (!adapter->pool_config)
 677                netif_stop_queue(netdev);
 678
 679        h_vio_signal(adapter->vdev->unit_address, VIO_IRQ_DISABLE);
 680
 681        do {
 682                lpar_rc = h_free_logical_lan(adapter->vdev->unit_address);
 683        } while (H_IS_LONG_BUSY(lpar_rc) || (lpar_rc == H_BUSY));
 684
 685        if (lpar_rc != H_SUCCESS) {
 686                netdev_err(netdev, "h_free_logical_lan failed with %lx, "
 687                           "continuing with close\n", lpar_rc);
 688        }
 689
 690        free_irq(netdev->irq, netdev);
 691
 692        adapter->rx_no_buffer = *(u64 *)(((char *)adapter->buffer_list_addr) +
 693                                                4096 - 8);
 694
 695        ibmveth_cleanup(adapter);
 696
 697        netdev_dbg(netdev, "close complete\n");
 698
 699        return 0;
 700}
 701
 702static int netdev_get_settings(struct net_device *dev, struct ethtool_cmd *cmd)
 703{
 704        cmd->supported = (SUPPORTED_1000baseT_Full | SUPPORTED_Autoneg |
 705                                SUPPORTED_FIBRE);
 706        cmd->advertising = (ADVERTISED_1000baseT_Full | ADVERTISED_Autoneg |
 707                                ADVERTISED_FIBRE);
 708        ethtool_cmd_speed_set(cmd, SPEED_1000);
 709        cmd->duplex = DUPLEX_FULL;
 710        cmd->port = PORT_FIBRE;
 711        cmd->phy_address = 0;
 712        cmd->transceiver = XCVR_INTERNAL;
 713        cmd->autoneg = AUTONEG_ENABLE;
 714        cmd->maxtxpkt = 0;
 715        cmd->maxrxpkt = 1;
 716        return 0;
 717}
 718
 719static void netdev_get_drvinfo(struct net_device *dev,
 720                               struct ethtool_drvinfo *info)
 721{
 722        strlcpy(info->driver, ibmveth_driver_name, sizeof(info->driver));
 723        strlcpy(info->version, ibmveth_driver_version, sizeof(info->version));
 724}
 725
 726static netdev_features_t ibmveth_fix_features(struct net_device *dev,
 727        netdev_features_t features)
 728{
 729        /*
 730         * Since the ibmveth firmware interface does not have the
 731         * concept of separate tx/rx checksum offload enable, if rx
 732         * checksum is disabled we also have to disable tx checksum
 733         * offload. Once we disable rx checksum offload, we are no
 734         * longer allowed to send tx buffers that are not properly
 735         * checksummed.
 736         */
 737
 738        if (!(features & NETIF_F_RXCSUM))
 739                features &= ~NETIF_F_ALL_CSUM;
 740
 741        return features;
 742}
 743
 744static int ibmveth_set_csum_offload(struct net_device *dev, u32 data)
 745{
 746        struct ibmveth_adapter *adapter = netdev_priv(dev);
 747        unsigned long set_attr, clr_attr, ret_attr;
 748        unsigned long set_attr6, clr_attr6;
 749        long ret, ret4, ret6;
 750        int rc1 = 0, rc2 = 0;
 751        int restart = 0;
 752
 753        if (netif_running(dev)) {
 754                restart = 1;
 755                adapter->pool_config = 1;
 756                ibmveth_close(dev);
 757                adapter->pool_config = 0;
 758        }
 759
 760        set_attr = 0;
 761        clr_attr = 0;
 762        set_attr6 = 0;
 763        clr_attr6 = 0;
 764
 765        if (data) {
 766                set_attr = IBMVETH_ILLAN_IPV4_TCP_CSUM;
 767                set_attr6 = IBMVETH_ILLAN_IPV6_TCP_CSUM;
 768        } else {
 769                clr_attr = IBMVETH_ILLAN_IPV4_TCP_CSUM;
 770                clr_attr6 = IBMVETH_ILLAN_IPV6_TCP_CSUM;
 771        }
 772
 773        ret = h_illan_attributes(adapter->vdev->unit_address, 0, 0, &ret_attr);
 774
 775        if (ret == H_SUCCESS && !(ret_attr & IBMVETH_ILLAN_ACTIVE_TRUNK) &&
 776            !(ret_attr & IBMVETH_ILLAN_TRUNK_PRI_MASK) &&
 777            (ret_attr & IBMVETH_ILLAN_PADDED_PKT_CSUM)) {
 778                ret4 = h_illan_attributes(adapter->vdev->unit_address, clr_attr,
 779                                         set_attr, &ret_attr);
 780
 781                if (ret4 != H_SUCCESS) {
 782                        netdev_err(dev, "unable to change IPv4 checksum "
 783                                        "offload settings. %d rc=%ld\n",
 784                                        data, ret4);
 785
 786                        h_illan_attributes(adapter->vdev->unit_address,
 787                                           set_attr, clr_attr, &ret_attr);
 788
 789                        if (data == 1)
 790                                dev->features &= ~NETIF_F_IP_CSUM;
 791
 792                } else {
 793                        adapter->fw_ipv4_csum_support = data;
 794                }
 795
 796                ret6 = h_illan_attributes(adapter->vdev->unit_address,
 797                                         clr_attr6, set_attr6, &ret_attr);
 798
 799                if (ret6 != H_SUCCESS) {
 800                        netdev_err(dev, "unable to change IPv6 checksum "
 801                                        "offload settings. %d rc=%ld\n",
 802                                        data, ret6);
 803
 804                        h_illan_attributes(adapter->vdev->unit_address,
 805                                           set_attr6, clr_attr6, &ret_attr);
 806
 807                        if (data == 1)
 808                                dev->features &= ~NETIF_F_IPV6_CSUM;
 809
 810                } else
 811                        adapter->fw_ipv6_csum_support = data;
 812
 813                if (ret4 == H_SUCCESS || ret6 == H_SUCCESS)
 814                        adapter->rx_csum = data;
 815                else
 816                        rc1 = -EIO;
 817        } else {
 818                rc1 = -EIO;
 819                netdev_err(dev, "unable to change checksum offload settings."
 820                                     " %d rc=%ld ret_attr=%lx\n", data, ret,
 821                                     ret_attr);
 822        }
 823
 824        if (restart)
 825                rc2 = ibmveth_open(dev);
 826
 827        return rc1 ? rc1 : rc2;
 828}
 829
 830static int ibmveth_set_features(struct net_device *dev,
 831        netdev_features_t features)
 832{
 833        struct ibmveth_adapter *adapter = netdev_priv(dev);
 834        int rx_csum = !!(features & NETIF_F_RXCSUM);
 835        int rc;
 836
 837        if (rx_csum == adapter->rx_csum)
 838                return 0;
 839
 840        rc = ibmveth_set_csum_offload(dev, rx_csum);
 841        if (rc && !adapter->rx_csum)
 842                dev->features = features & ~(NETIF_F_ALL_CSUM | NETIF_F_RXCSUM);
 843
 844        return rc;
 845}
 846
 847static void ibmveth_get_strings(struct net_device *dev, u32 stringset, u8 *data)
 848{
 849        int i;
 850
 851        if (stringset != ETH_SS_STATS)
 852                return;
 853
 854        for (i = 0; i < ARRAY_SIZE(ibmveth_stats); i++, data += ETH_GSTRING_LEN)
 855                memcpy(data, ibmveth_stats[i].name, ETH_GSTRING_LEN);
 856}
 857
 858static int ibmveth_get_sset_count(struct net_device *dev, int sset)
 859{
 860        switch (sset) {
 861        case ETH_SS_STATS:
 862                return ARRAY_SIZE(ibmveth_stats);
 863        default:
 864                return -EOPNOTSUPP;
 865        }
 866}
 867
 868static void ibmveth_get_ethtool_stats(struct net_device *dev,
 869                                      struct ethtool_stats *stats, u64 *data)
 870{
 871        int i;
 872        struct ibmveth_adapter *adapter = netdev_priv(dev);
 873
 874        for (i = 0; i < ARRAY_SIZE(ibmveth_stats); i++)
 875                data[i] = IBMVETH_GET_STAT(adapter, ibmveth_stats[i].offset);
 876}
 877
 878static const struct ethtool_ops netdev_ethtool_ops = {
 879        .get_drvinfo            = netdev_get_drvinfo,
 880        .get_settings           = netdev_get_settings,
 881        .get_link               = ethtool_op_get_link,
 882        .get_strings            = ibmveth_get_strings,
 883        .get_sset_count         = ibmveth_get_sset_count,
 884        .get_ethtool_stats      = ibmveth_get_ethtool_stats,
 885};
 886
 887static int ibmveth_ioctl(struct net_device *dev, struct ifreq *ifr, int cmd)
 888{
 889        return -EOPNOTSUPP;
 890}
 891
 892#define page_offset(v) ((unsigned long)(v) & ((1 << 12) - 1))
 893
 894static int ibmveth_send(struct ibmveth_adapter *adapter,
 895                        union ibmveth_buf_desc *descs)
 896{
 897        unsigned long correlator;
 898        unsigned int retry_count;
 899        unsigned long ret;
 900
 901        /*
 902         * The retry count sets a maximum for the number of broadcast and
 903         * multicast destinations within the system.
 904         */
 905        retry_count = 1024;
 906        correlator = 0;
 907        do {
 908                ret = h_send_logical_lan(adapter->vdev->unit_address,
 909                                             descs[0].desc, descs[1].desc,
 910                                             descs[2].desc, descs[3].desc,
 911                                             descs[4].desc, descs[5].desc,
 912                                             correlator, &correlator);
 913        } while ((ret == H_BUSY) && (retry_count--));
 914
 915        if (ret != H_SUCCESS && ret != H_DROPPED) {
 916                netdev_err(adapter->netdev, "tx: h_send_logical_lan failed "
 917                           "with rc=%ld\n", ret);
 918                return 1;
 919        }
 920
 921        return 0;
 922}
 923
 924static netdev_tx_t ibmveth_start_xmit(struct sk_buff *skb,
 925                                      struct net_device *netdev)
 926{
 927        struct ibmveth_adapter *adapter = netdev_priv(netdev);
 928        unsigned int desc_flags;
 929        union ibmveth_buf_desc descs[6];
 930        int last, i;
 931        int force_bounce = 0;
 932        dma_addr_t dma_addr;
 933
 934        /*
 935         * veth handles a maximum of 6 segments including the header, so
 936         * we have to linearize the skb if there are more than this.
 937         */
 938        if (skb_shinfo(skb)->nr_frags > 5 && __skb_linearize(skb)) {
 939                netdev->stats.tx_dropped++;
 940                goto out;
 941        }
 942
 943        /* veth can't checksum offload UDP */
 944        if (skb->ip_summed == CHECKSUM_PARTIAL &&
 945            ((skb->protocol == htons(ETH_P_IP) &&
 946              ip_hdr(skb)->protocol != IPPROTO_TCP) ||
 947             (skb->protocol == htons(ETH_P_IPV6) &&
 948              ipv6_hdr(skb)->nexthdr != IPPROTO_TCP)) &&
 949            skb_checksum_help(skb)) {
 950
 951                netdev_err(netdev, "tx: failed to checksum packet\n");
 952                netdev->stats.tx_dropped++;
 953                goto out;
 954        }
 955
 956        desc_flags = IBMVETH_BUF_VALID;
 957
 958        if (skb->ip_summed == CHECKSUM_PARTIAL) {
 959                unsigned char *buf = skb_transport_header(skb) +
 960                                                skb->csum_offset;
 961
 962                desc_flags |= (IBMVETH_BUF_NO_CSUM | IBMVETH_BUF_CSUM_GOOD);
 963
 964                /* Need to zero out the checksum */
 965                buf[0] = 0;
 966                buf[1] = 0;
 967        }
 968
 969retry_bounce:
 970        memset(descs, 0, sizeof(descs));
 971
 972        /*
 973         * If a linear packet is below the rx threshold then
 974         * copy it into the static bounce buffer. This avoids the
 975         * cost of a TCE insert and remove.
 976         */
 977        if (force_bounce || (!skb_is_nonlinear(skb) &&
 978                                (skb->len < tx_copybreak))) {
 979                skb_copy_from_linear_data(skb, adapter->bounce_buffer,
 980                                          skb->len);
 981
 982                descs[0].fields.flags_len = desc_flags | skb->len;
 983                descs[0].fields.address = adapter->bounce_buffer_dma;
 984
 985                if (ibmveth_send(adapter, descs)) {
 986                        adapter->tx_send_failed++;
 987                        netdev->stats.tx_dropped++;
 988                } else {
 989                        netdev->stats.tx_packets++;
 990                        netdev->stats.tx_bytes += skb->len;
 991                }
 992
 993                goto out;
 994        }
 995
 996        /* Map the header */
 997        dma_addr = dma_map_single(&adapter->vdev->dev, skb->data,
 998                                  skb_headlen(skb), DMA_TO_DEVICE);
 999        if (dma_mapping_error(&adapter->vdev->dev, dma_addr))
1000                goto map_failed;
1001
1002        descs[0].fields.flags_len = desc_flags | skb_headlen(skb);
1003        descs[0].fields.address = dma_addr;
1004
1005        /* Map the frags */
1006        for (i = 0; i < skb_shinfo(skb)->nr_frags; i++) {
1007                const skb_frag_t *frag = &skb_shinfo(skb)->frags[i];
1008
1009                dma_addr = skb_frag_dma_map(&adapter->vdev->dev, frag, 0,
1010                                            skb_frag_size(frag), DMA_TO_DEVICE);
1011
1012                if (dma_mapping_error(&adapter->vdev->dev, dma_addr))
1013                        goto map_failed_frags;
1014
1015                descs[i+1].fields.flags_len = desc_flags | skb_frag_size(frag);
1016                descs[i+1].fields.address = dma_addr;
1017        }
1018
1019        if (ibmveth_send(adapter, descs)) {
1020                adapter->tx_send_failed++;
1021                netdev->stats.tx_dropped++;
1022        } else {
1023                netdev->stats.tx_packets++;
1024                netdev->stats.tx_bytes += skb->len;
1025        }
1026
1027        dma_unmap_single(&adapter->vdev->dev,
1028                         descs[0].fields.address,
1029                         descs[0].fields.flags_len & IBMVETH_BUF_LEN_MASK,
1030                         DMA_TO_DEVICE);
1031
1032        for (i = 1; i < skb_shinfo(skb)->nr_frags + 1; i++)
1033                dma_unmap_page(&adapter->vdev->dev, descs[i].fields.address,
1034                               descs[i].fields.flags_len & IBMVETH_BUF_LEN_MASK,
1035                               DMA_TO_DEVICE);
1036
1037out:
1038        dev_kfree_skb(skb);
1039        return NETDEV_TX_OK;
1040
1041map_failed_frags:
1042        last = i+1;
1043        for (i = 0; i < last; i++)
1044                dma_unmap_page(&adapter->vdev->dev, descs[i].fields.address,
1045                               descs[i].fields.flags_len & IBMVETH_BUF_LEN_MASK,
1046                               DMA_TO_DEVICE);
1047
1048map_failed:
1049        if (!firmware_has_feature(FW_FEATURE_CMO))
1050                netdev_err(netdev, "tx: unable to map xmit buffer\n");
1051        adapter->tx_map_failed++;
1052        skb_linearize(skb);
1053        force_bounce = 1;
1054        goto retry_bounce;
1055}
1056
1057static int ibmveth_poll(struct napi_struct *napi, int budget)
1058{
1059        struct ibmveth_adapter *adapter =
1060                        container_of(napi, struct ibmveth_adapter, napi);
1061        struct net_device *netdev = adapter->netdev;
1062        int frames_processed = 0;
1063        unsigned long lpar_rc;
1064
1065restart_poll:
1066        do {
1067                if (!ibmveth_rxq_pending_buffer(adapter))
1068                        break;
1069
1070                smp_rmb();
1071                if (!ibmveth_rxq_buffer_valid(adapter)) {
1072                        wmb(); /* suggested by larson1 */
1073                        adapter->rx_invalid_buffer++;
1074                        netdev_dbg(netdev, "recycling invalid buffer\n");
1075                        ibmveth_rxq_recycle_buffer(adapter);
1076                } else {
1077                        struct sk_buff *skb, *new_skb;
1078                        int length = ibmveth_rxq_frame_length(adapter);
1079                        int offset = ibmveth_rxq_frame_offset(adapter);
1080                        int csum_good = ibmveth_rxq_csum_good(adapter);
1081
1082                        skb = ibmveth_rxq_get_buffer(adapter);
1083
1084                        new_skb = NULL;
1085                        if (length < rx_copybreak)
1086                                new_skb = netdev_alloc_skb(netdev, length);
1087
1088                        if (new_skb) {
1089                                skb_copy_to_linear_data(new_skb,
1090                                                        skb->data + offset,
1091                                                        length);
1092                                if (rx_flush)
1093                                        ibmveth_flush_buffer(skb->data,
1094                                                length + offset);
1095                                if (!ibmveth_rxq_recycle_buffer(adapter))
1096                                        kfree_skb(skb);
1097                                skb = new_skb;
1098                        } else {
1099                                ibmveth_rxq_harvest_buffer(adapter);
1100                                skb_reserve(skb, offset);
1101                        }
1102
1103                        skb_put(skb, length);
1104                        skb->protocol = eth_type_trans(skb, netdev);
1105
1106                        if (csum_good)
1107                                skb->ip_summed = CHECKSUM_UNNECESSARY;
1108
1109                        netif_receive_skb(skb); /* send it up */
1110
1111                        netdev->stats.rx_packets++;
1112                        netdev->stats.rx_bytes += length;
1113                        frames_processed++;
1114                }
1115        } while (frames_processed < budget);
1116
1117        ibmveth_replenish_task(adapter);
1118
1119        if (frames_processed < budget) {
1120                /* We think we are done - reenable interrupts,
1121                 * then check once more to make sure we are done.
1122                 */
1123                lpar_rc = h_vio_signal(adapter->vdev->unit_address,
1124                                       VIO_IRQ_ENABLE);
1125
1126                BUG_ON(lpar_rc != H_SUCCESS);
1127
1128                napi_complete(napi);
1129
1130                if (ibmveth_rxq_pending_buffer(adapter) &&
1131                    napi_reschedule(napi)) {
1132                        lpar_rc = h_vio_signal(adapter->vdev->unit_address,
1133                                               VIO_IRQ_DISABLE);
1134                        goto restart_poll;
1135                }
1136        }
1137
1138        return frames_processed;
1139}
1140
1141static irqreturn_t ibmveth_interrupt(int irq, void *dev_instance)
1142{
1143        struct net_device *netdev = dev_instance;
1144        struct ibmveth_adapter *adapter = netdev_priv(netdev);
1145        unsigned long lpar_rc;
1146
1147        if (napi_schedule_prep(&adapter->napi)) {
1148                lpar_rc = h_vio_signal(adapter->vdev->unit_address,
1149                                       VIO_IRQ_DISABLE);
1150                BUG_ON(lpar_rc != H_SUCCESS);
1151                __napi_schedule(&adapter->napi);
1152        }
1153        return IRQ_HANDLED;
1154}
1155
1156static void ibmveth_set_multicast_list(struct net_device *netdev)
1157{
1158        struct ibmveth_adapter *adapter = netdev_priv(netdev);
1159        unsigned long lpar_rc;
1160
1161        if ((netdev->flags & IFF_PROMISC) ||
1162            (netdev_mc_count(netdev) > adapter->mcastFilterSize)) {
1163                lpar_rc = h_multicast_ctrl(adapter->vdev->unit_address,
1164                                           IbmVethMcastEnableRecv |
1165                                           IbmVethMcastDisableFiltering,
1166                                           0);
1167                if (lpar_rc != H_SUCCESS) {
1168                        netdev_err(netdev, "h_multicast_ctrl rc=%ld when "
1169                                   "entering promisc mode\n", lpar_rc);
1170                }
1171        } else {
1172                struct netdev_hw_addr *ha;
1173                /* clear the filter table & disable filtering */
1174                lpar_rc = h_multicast_ctrl(adapter->vdev->unit_address,
1175                                           IbmVethMcastEnableRecv |
1176                                           IbmVethMcastDisableFiltering |
1177                                           IbmVethMcastClearFilterTable,
1178                                           0);
1179                if (lpar_rc != H_SUCCESS) {
1180                        netdev_err(netdev, "h_multicast_ctrl rc=%ld when "
1181                                   "attempting to clear filter table\n",
1182                                   lpar_rc);
1183                }
1184                /* add the addresses to the filter table */
1185                netdev_for_each_mc_addr(ha, netdev) {
1186                        /* add the multicast address to the filter table */
1187                        unsigned long mcast_addr = 0;
1188                        memcpy(((char *)&mcast_addr)+2, ha->addr, 6);
1189                        lpar_rc = h_multicast_ctrl(adapter->vdev->unit_address,
1190                                                   IbmVethMcastAddFilter,
1191                                                   mcast_addr);
1192                        if (lpar_rc != H_SUCCESS) {
1193                                netdev_err(netdev, "h_multicast_ctrl rc=%ld "
1194                                           "when adding an entry to the filter "
1195                                           "table\n", lpar_rc);
1196                        }
1197                }
1198
1199                /* re-enable filtering */
1200                lpar_rc = h_multicast_ctrl(adapter->vdev->unit_address,
1201                                           IbmVethMcastEnableFiltering,
1202                                           0);
1203                if (lpar_rc != H_SUCCESS) {
1204                        netdev_err(netdev, "h_multicast_ctrl rc=%ld when "
1205                                   "enabling filtering\n", lpar_rc);
1206                }
1207        }
1208}
1209
1210static int ibmveth_change_mtu(struct net_device *dev, int new_mtu)
1211{
1212        struct ibmveth_adapter *adapter = netdev_priv(dev);
1213        struct vio_dev *viodev = adapter->vdev;
1214        int new_mtu_oh = new_mtu + IBMVETH_BUFF_OH;
1215        int i, rc;
1216        int need_restart = 0;
1217
1218        if (new_mtu < IBMVETH_MIN_MTU)
1219                return -EINVAL;
1220
1221        for (i = 0; i < IBMVETH_NUM_BUFF_POOLS; i++)
1222                if (new_mtu_oh < adapter->rx_buff_pool[i].buff_size)
1223                        break;
1224
1225        if (i == IBMVETH_NUM_BUFF_POOLS)
1226                return -EINVAL;
1227
1228        /* Deactivate all the buffer pools so that the next loop can activate
1229           only the buffer pools necessary to hold the new MTU */
1230        if (netif_running(adapter->netdev)) {
1231                need_restart = 1;
1232                adapter->pool_config = 1;
1233                ibmveth_close(adapter->netdev);
1234                adapter->pool_config = 0;
1235        }
1236
1237        /* Look for an active buffer pool that can hold the new MTU */
1238        for (i = 0; i < IBMVETH_NUM_BUFF_POOLS; i++) {
1239                adapter->rx_buff_pool[i].active = 1;
1240
1241                if (new_mtu_oh < adapter->rx_buff_pool[i].buff_size) {
1242                        dev->mtu = new_mtu;
1243                        vio_cmo_set_dev_desired(viodev,
1244                                                ibmveth_get_desired_dma
1245                                                (viodev));
1246                        if (need_restart) {
1247                                return ibmveth_open(adapter->netdev);
1248                        }
1249                        return 0;
1250                }
1251        }
1252
1253        if (need_restart && (rc = ibmveth_open(adapter->netdev)))
1254                return rc;
1255
1256        return -EINVAL;
1257}
1258
1259#ifdef CONFIG_NET_POLL_CONTROLLER
1260static void ibmveth_poll_controller(struct net_device *dev)
1261{
1262        ibmveth_replenish_task(netdev_priv(dev));
1263        ibmveth_interrupt(dev->irq, dev);
1264}
1265#endif
1266
1267/**
1268 * ibmveth_get_desired_dma - Calculate IO memory desired by the driver
1269 *
1270 * @vdev: struct vio_dev for the device whose desired IO mem is to be returned
1271 *
1272 * Return value:
1273 *      Number of bytes of IO data the driver will need to perform well.
1274 */
1275static unsigned long ibmveth_get_desired_dma(struct vio_dev *vdev)
1276{
1277        struct net_device *netdev = dev_get_drvdata(&vdev->dev);
1278        struct ibmveth_adapter *adapter;
1279        unsigned long ret;
1280        int i;
1281        int rxqentries = 1;
1282
1283        /* netdev inits at probe time along with the structures we need below*/
1284        if (netdev == NULL)
1285                return IOMMU_PAGE_ALIGN(IBMVETH_IO_ENTITLEMENT_DEFAULT);
1286
1287        adapter = netdev_priv(netdev);
1288
1289        ret = IBMVETH_BUFF_LIST_SIZE + IBMVETH_FILT_LIST_SIZE;
1290        ret += IOMMU_PAGE_ALIGN(netdev->mtu);
1291
1292        for (i = 0; i < IBMVETH_NUM_BUFF_POOLS; i++) {
1293                /* add the size of the active receive buffers */
1294                if (adapter->rx_buff_pool[i].active)
1295                        ret +=
1296                            adapter->rx_buff_pool[i].size *
1297                            IOMMU_PAGE_ALIGN(adapter->rx_buff_pool[i].
1298                                    buff_size);
1299                rxqentries += adapter->rx_buff_pool[i].size;
1300        }
1301        /* add the size of the receive queue entries */
1302        ret += IOMMU_PAGE_ALIGN(rxqentries * sizeof(struct ibmveth_rx_q_entry));
1303
1304        return ret;
1305}
1306
1307static const struct net_device_ops ibmveth_netdev_ops = {
1308        .ndo_open               = ibmveth_open,
1309        .ndo_stop               = ibmveth_close,
1310        .ndo_start_xmit         = ibmveth_start_xmit,
1311        .ndo_set_rx_mode        = ibmveth_set_multicast_list,
1312        .ndo_do_ioctl           = ibmveth_ioctl,
1313        .ndo_change_mtu         = ibmveth_change_mtu,
1314        .ndo_fix_features       = ibmveth_fix_features,
1315        .ndo_set_features       = ibmveth_set_features,
1316        .ndo_validate_addr      = eth_validate_addr,
1317        .ndo_set_mac_address    = eth_mac_addr,
1318#ifdef CONFIG_NET_POLL_CONTROLLER
1319        .ndo_poll_controller    = ibmveth_poll_controller,
1320#endif
1321};
1322
1323static int ibmveth_probe(struct vio_dev *dev, const struct vio_device_id *id)
1324{
1325        int rc, i, mac_len;
1326        struct net_device *netdev;
1327        struct ibmveth_adapter *adapter;
1328        unsigned char *mac_addr_p;
1329        unsigned int *mcastFilterSize_p;
1330
1331        dev_dbg(&dev->dev, "entering ibmveth_probe for UA 0x%x\n",
1332                dev->unit_address);
1333
1334        mac_addr_p = (unsigned char *)vio_get_attribute(dev, VETH_MAC_ADDR,
1335                                                        &mac_len);
1336        if (!mac_addr_p) {
1337                dev_err(&dev->dev, "Can't find VETH_MAC_ADDR attribute\n");
1338                return -EINVAL;
1339        }
1340        /* Workaround for old/broken pHyp */
1341        if (mac_len == 8)
1342                mac_addr_p += 2;
1343        else if (mac_len != 6) {
1344                dev_err(&dev->dev, "VETH_MAC_ADDR attribute wrong len %d\n",
1345                        mac_len);
1346                return -EINVAL;
1347        }
1348
1349        mcastFilterSize_p = (unsigned int *)vio_get_attribute(dev,
1350                                                VETH_MCAST_FILTER_SIZE, NULL);
1351        if (!mcastFilterSize_p) {
1352                dev_err(&dev->dev, "Can't find VETH_MCAST_FILTER_SIZE "
1353                        "attribute\n");
1354                return -EINVAL;
1355        }
1356
1357        netdev = alloc_etherdev(sizeof(struct ibmveth_adapter));
1358
1359        if (!netdev)
1360                return -ENOMEM;
1361
1362        adapter = netdev_priv(netdev);
1363        dev_set_drvdata(&dev->dev, netdev);
1364
1365        adapter->vdev = dev;
1366        adapter->netdev = netdev;
1367        adapter->mcastFilterSize = *mcastFilterSize_p;
1368        adapter->pool_config = 0;
1369
1370        netif_napi_add(netdev, &adapter->napi, ibmveth_poll, 16);
1371
1372        adapter->mac_addr = 0;
1373        memcpy(&adapter->mac_addr, mac_addr_p, 6);
1374
1375        netdev->irq = dev->irq;
1376        netdev->netdev_ops = &ibmveth_netdev_ops;
1377        netdev->ethtool_ops = &netdev_ethtool_ops;
1378        SET_NETDEV_DEV(netdev, &dev->dev);
1379        netdev->hw_features = NETIF_F_SG | NETIF_F_RXCSUM |
1380                NETIF_F_IP_CSUM | NETIF_F_IPV6_CSUM;
1381        netdev->features |= netdev->hw_features;
1382
1383        memcpy(netdev->dev_addr, &adapter->mac_addr, netdev->addr_len);
1384
1385        for (i = 0; i < IBMVETH_NUM_BUFF_POOLS; i++) {
1386                struct kobject *kobj = &adapter->rx_buff_pool[i].kobj;
1387                int error;
1388
1389                ibmveth_init_buffer_pool(&adapter->rx_buff_pool[i], i,
1390                                         pool_count[i], pool_size[i],
1391                                         pool_active[i]);
1392                error = kobject_init_and_add(kobj, &ktype_veth_pool,
1393                                             &dev->dev.kobj, "pool%d", i);
1394                if (!error)
1395                        kobject_uevent(kobj, KOBJ_ADD);
1396        }
1397
1398        netdev_dbg(netdev, "adapter @ 0x%p\n", adapter);
1399
1400        adapter->buffer_list_dma = DMA_ERROR_CODE;
1401        adapter->filter_list_dma = DMA_ERROR_CODE;
1402        adapter->rx_queue.queue_dma = DMA_ERROR_CODE;
1403
1404        netdev_dbg(netdev, "registering netdev...\n");
1405
1406        ibmveth_set_features(netdev, netdev->features);
1407
1408        rc = register_netdev(netdev);
1409
1410        if (rc) {
1411                netdev_dbg(netdev, "failed to register netdev rc=%d\n", rc);
1412                free_netdev(netdev);
1413                return rc;
1414        }
1415
1416        netdev_dbg(netdev, "registered\n");
1417
1418        return 0;
1419}
1420
1421static int ibmveth_remove(struct vio_dev *dev)
1422{
1423        struct net_device *netdev = dev_get_drvdata(&dev->dev);
1424        struct ibmveth_adapter *adapter = netdev_priv(netdev);
1425        int i;
1426
1427        for (i = 0; i < IBMVETH_NUM_BUFF_POOLS; i++)
1428                kobject_put(&adapter->rx_buff_pool[i].kobj);
1429
1430        unregister_netdev(netdev);
1431
1432        free_netdev(netdev);
1433        dev_set_drvdata(&dev->dev, NULL);
1434
1435        return 0;
1436}
1437
1438static struct attribute veth_active_attr;
1439static struct attribute veth_num_attr;
1440static struct attribute veth_size_attr;
1441
1442static ssize_t veth_pool_show(struct kobject *kobj,
1443                              struct attribute *attr, char *buf)
1444{
1445        struct ibmveth_buff_pool *pool = container_of(kobj,
1446                                                      struct ibmveth_buff_pool,
1447                                                      kobj);
1448
1449        if (attr == &veth_active_attr)
1450                return sprintf(buf, "%d\n", pool->active);
1451        else if (attr == &veth_num_attr)
1452                return sprintf(buf, "%d\n", pool->size);
1453        else if (attr == &veth_size_attr)
1454                return sprintf(buf, "%d\n", pool->buff_size);
1455        return 0;
1456}
1457
1458static ssize_t veth_pool_store(struct kobject *kobj, struct attribute *attr,
1459                               const char *buf, size_t count)
1460{
1461        struct ibmveth_buff_pool *pool = container_of(kobj,
1462                                                      struct ibmveth_buff_pool,
1463                                                      kobj);
1464        struct net_device *netdev = dev_get_drvdata(
1465            container_of(kobj->parent, struct device, kobj));
1466        struct ibmveth_adapter *adapter = netdev_priv(netdev);
1467        long value = simple_strtol(buf, NULL, 10);
1468        long rc;
1469
1470        if (attr == &veth_active_attr) {
1471                if (value && !pool->active) {
1472                        if (netif_running(netdev)) {
1473                                if (ibmveth_alloc_buffer_pool(pool)) {
1474                                        netdev_err(netdev,
1475                                                   "unable to alloc pool\n");
1476                                        return -ENOMEM;
1477                                }
1478                                pool->active = 1;
1479                                adapter->pool_config = 1;
1480                                ibmveth_close(netdev);
1481                                adapter->pool_config = 0;
1482                                if ((rc = ibmveth_open(netdev)))
1483                                        return rc;
1484                        } else {
1485                                pool->active = 1;
1486                        }
1487                } else if (!value && pool->active) {
1488                        int mtu = netdev->mtu + IBMVETH_BUFF_OH;
1489                        int i;
1490                        /* Make sure there is a buffer pool with buffers that
1491                           can hold a packet of the size of the MTU */
1492                        for (i = 0; i < IBMVETH_NUM_BUFF_POOLS; i++) {
1493                                if (pool == &adapter->rx_buff_pool[i])
1494                                        continue;
1495                                if (!adapter->rx_buff_pool[i].active)
1496                                        continue;
1497                                if (mtu <= adapter->rx_buff_pool[i].buff_size)
1498                                        break;
1499                        }
1500
1501                        if (i == IBMVETH_NUM_BUFF_POOLS) {
1502                                netdev_err(netdev, "no active pool >= MTU\n");
1503                                return -EPERM;
1504                        }
1505
1506                        if (netif_running(netdev)) {
1507                                adapter->pool_config = 1;
1508                                ibmveth_close(netdev);
1509                                pool->active = 0;
1510                                adapter->pool_config = 0;
1511                                if ((rc = ibmveth_open(netdev)))
1512                                        return rc;
1513                        }
1514                        pool->active = 0;
1515                }
1516        } else if (attr == &veth_num_attr) {
1517                if (value <= 0 || value > IBMVETH_MAX_POOL_COUNT) {
1518                        return -EINVAL;
1519                } else {
1520                        if (netif_running(netdev)) {
1521                                adapter->pool_config = 1;
1522                                ibmveth_close(netdev);
1523                                adapter->pool_config = 0;
1524                                pool->size = value;
1525                                if ((rc = ibmveth_open(netdev)))
1526                                        return rc;
1527                        } else {
1528                                pool->size = value;
1529                        }
1530                }
1531        } else if (attr == &veth_size_attr) {
1532                if (value <= IBMVETH_BUFF_OH || value > IBMVETH_MAX_BUF_SIZE) {
1533                        return -EINVAL;
1534                } else {
1535                        if (netif_running(netdev)) {
1536                                adapter->pool_config = 1;
1537                                ibmveth_close(netdev);
1538                                adapter->pool_config = 0;
1539                                pool->buff_size = value;
1540                                if ((rc = ibmveth_open(netdev)))
1541                                        return rc;
1542                        } else {
1543                                pool->buff_size = value;
1544                        }
1545                }
1546        }
1547
1548        /* kick the interrupt handler to allocate/deallocate pools */
1549        ibmveth_interrupt(netdev->irq, netdev);
1550        return count;
1551}
1552
1553
1554#define ATTR(_name, _mode)                              \
1555        struct attribute veth_##_name##_attr = {        \
1556        .name = __stringify(_name), .mode = _mode,      \
1557        };
1558
1559static ATTR(active, 0644);
1560static ATTR(num, 0644);
1561static ATTR(size, 0644);
1562
1563static struct attribute *veth_pool_attrs[] = {
1564        &veth_active_attr,
1565        &veth_num_attr,
1566        &veth_size_attr,
1567        NULL,
1568};
1569
1570static const struct sysfs_ops veth_pool_ops = {
1571        .show   = veth_pool_show,
1572        .store  = veth_pool_store,
1573};
1574
1575static struct kobj_type ktype_veth_pool = {
1576        .release        = NULL,
1577        .sysfs_ops      = &veth_pool_ops,
1578        .default_attrs  = veth_pool_attrs,
1579};
1580
1581static int ibmveth_resume(struct device *dev)
1582{
1583        struct net_device *netdev = dev_get_drvdata(dev);
1584        ibmveth_interrupt(netdev->irq, netdev);
1585        return 0;
1586}
1587
1588static struct vio_device_id ibmveth_device_table[] = {
1589        { "network", "IBM,l-lan"},
1590        { "", "" }
1591};
1592MODULE_DEVICE_TABLE(vio, ibmveth_device_table);
1593
1594static struct dev_pm_ops ibmveth_pm_ops = {
1595        .resume = ibmveth_resume
1596};
1597
1598static struct vio_driver ibmveth_driver = {
1599        .id_table       = ibmveth_device_table,
1600        .probe          = ibmveth_probe,
1601        .remove         = ibmveth_remove,
1602        .get_desired_dma = ibmveth_get_desired_dma,
1603        .name           = ibmveth_driver_name,
1604        .pm             = &ibmveth_pm_ops,
1605};
1606
1607static int __init ibmveth_module_init(void)
1608{
1609        printk(KERN_DEBUG "%s: %s %s\n", ibmveth_driver_name,
1610               ibmveth_driver_string, ibmveth_driver_version);
1611
1612        return vio_register_driver(&ibmveth_driver);
1613}
1614
1615static void __exit ibmveth_module_exit(void)
1616{
1617        vio_unregister_driver(&ibmveth_driver);
1618}
1619
1620module_init(ibmveth_module_init);
1621module_exit(ibmveth_module_exit);
1622