linux/drivers/pci/pcie/aspm.c
<<
>>
Prefs
   1/*
   2 * File:        drivers/pci/pcie/aspm.c
   3 * Enabling PCIe link L0s/L1 state and Clock Power Management
   4 *
   5 * Copyright (C) 2007 Intel
   6 * Copyright (C) Zhang Yanmin (yanmin.zhang@intel.com)
   7 * Copyright (C) Shaohua Li (shaohua.li@intel.com)
   8 */
   9
  10#include <linux/kernel.h>
  11#include <linux/module.h>
  12#include <linux/moduleparam.h>
  13#include <linux/pci.h>
  14#include <linux/pci_regs.h>
  15#include <linux/errno.h>
  16#include <linux/pm.h>
  17#include <linux/init.h>
  18#include <linux/slab.h>
  19#include <linux/jiffies.h>
  20#include <linux/delay.h>
  21#include <linux/pci-aspm.h>
  22#include "../pci.h"
  23
  24#ifdef MODULE_PARAM_PREFIX
  25#undef MODULE_PARAM_PREFIX
  26#endif
  27#define MODULE_PARAM_PREFIX "pcie_aspm."
  28
  29/* Note: those are not register definitions */
  30#define ASPM_STATE_L0S_UP       (1)     /* Upstream direction L0s state */
  31#define ASPM_STATE_L0S_DW       (2)     /* Downstream direction L0s state */
  32#define ASPM_STATE_L1           (4)     /* L1 state */
  33#define ASPM_STATE_L0S          (ASPM_STATE_L0S_UP | ASPM_STATE_L0S_DW)
  34#define ASPM_STATE_ALL          (ASPM_STATE_L0S | ASPM_STATE_L1)
  35
  36struct aspm_latency {
  37        u32 l0s;                        /* L0s latency (nsec) */
  38        u32 l1;                         /* L1 latency (nsec) */
  39};
  40
  41struct pcie_link_state {
  42        struct pci_dev *pdev;           /* Upstream component of the Link */
  43        struct pcie_link_state *root;   /* pointer to the root port link */
  44        struct pcie_link_state *parent; /* pointer to the parent Link state */
  45        struct list_head sibling;       /* node in link_list */
  46        struct list_head children;      /* list of child link states */
  47        struct list_head link;          /* node in parent's children list */
  48
  49        /* ASPM state */
  50        u32 aspm_support:3;             /* Supported ASPM state */
  51        u32 aspm_enabled:3;             /* Enabled ASPM state */
  52        u32 aspm_capable:3;             /* Capable ASPM state with latency */
  53        u32 aspm_default:3;             /* Default ASPM state by BIOS */
  54        u32 aspm_disable:3;             /* Disabled ASPM state */
  55
  56        /* Clock PM state */
  57        u32 clkpm_capable:1;            /* Clock PM capable? */
  58        u32 clkpm_enabled:1;            /* Current Clock PM state */
  59        u32 clkpm_default:1;            /* Default Clock PM state by BIOS */
  60
  61        /* Exit latencies */
  62        struct aspm_latency latency_up; /* Upstream direction exit latency */
  63        struct aspm_latency latency_dw; /* Downstream direction exit latency */
  64        /*
  65         * Endpoint acceptable latencies. A pcie downstream port only
  66         * has one slot under it, so at most there are 8 functions.
  67         */
  68        struct aspm_latency acceptable[8];
  69};
  70
  71static int aspm_disabled, aspm_force, aspm_clear_state;
  72static DEFINE_MUTEX(aspm_lock);
  73static LIST_HEAD(link_list);
  74
  75#define POLICY_DEFAULT 0        /* BIOS default setting */
  76#define POLICY_PERFORMANCE 1    /* high performance */
  77#define POLICY_POWERSAVE 2      /* high power saving */
  78static int aspm_policy;
  79static const char *policy_str[] = {
  80        [POLICY_DEFAULT] = "default",
  81        [POLICY_PERFORMANCE] = "performance",
  82        [POLICY_POWERSAVE] = "powersave"
  83};
  84
  85#define LINK_RETRAIN_TIMEOUT HZ
  86
  87static int policy_to_aspm_state(struct pcie_link_state *link)
  88{
  89        switch (aspm_policy) {
  90        case POLICY_PERFORMANCE:
  91                /* Disable ASPM and Clock PM */
  92                return 0;
  93        case POLICY_POWERSAVE:
  94                /* Enable ASPM L0s/L1 */
  95                return ASPM_STATE_ALL;
  96        case POLICY_DEFAULT:
  97                return link->aspm_default;
  98        }
  99        return 0;
 100}
 101
 102static int policy_to_clkpm_state(struct pcie_link_state *link)
 103{
 104        switch (aspm_policy) {
 105        case POLICY_PERFORMANCE:
 106                /* Disable ASPM and Clock PM */
 107                return 0;
 108        case POLICY_POWERSAVE:
 109                /* Disable Clock PM */
 110                return 1;
 111        case POLICY_DEFAULT:
 112                return link->clkpm_default;
 113        }
 114        return 0;
 115}
 116
 117static void pcie_set_clkpm_nocheck(struct pcie_link_state *link, int enable)
 118{
 119        int pos;
 120        u16 reg16;
 121        struct pci_dev *child;
 122        struct pci_bus *linkbus = link->pdev->subordinate;
 123
 124        list_for_each_entry(child, &linkbus->devices, bus_list) {
 125                pos = pci_pcie_cap(child);
 126                if (!pos)
 127                        return;
 128                pci_read_config_word(child, pos + PCI_EXP_LNKCTL, &reg16);
 129                if (enable)
 130                        reg16 |= PCI_EXP_LNKCTL_CLKREQ_EN;
 131                else
 132                        reg16 &= ~PCI_EXP_LNKCTL_CLKREQ_EN;
 133                pci_write_config_word(child, pos + PCI_EXP_LNKCTL, reg16);
 134        }
 135        link->clkpm_enabled = !!enable;
 136}
 137
 138static void pcie_set_clkpm(struct pcie_link_state *link, int enable)
 139{
 140        /* Don't enable Clock PM if the link is not Clock PM capable */
 141        if (!link->clkpm_capable && enable)
 142                enable = 0;
 143        /* Need nothing if the specified equals to current state */
 144        if (link->clkpm_enabled == enable)
 145                return;
 146        pcie_set_clkpm_nocheck(link, enable);
 147}
 148
 149static void pcie_clkpm_cap_init(struct pcie_link_state *link, int blacklist)
 150{
 151        int pos, capable = 1, enabled = 1;
 152        u32 reg32;
 153        u16 reg16;
 154        struct pci_dev *child;
 155        struct pci_bus *linkbus = link->pdev->subordinate;
 156
 157        /* All functions should have the same cap and state, take the worst */
 158        list_for_each_entry(child, &linkbus->devices, bus_list) {
 159                pos = pci_pcie_cap(child);
 160                if (!pos)
 161                        return;
 162                pci_read_config_dword(child, pos + PCI_EXP_LNKCAP, &reg32);
 163                if (!(reg32 & PCI_EXP_LNKCAP_CLKPM)) {
 164                        capable = 0;
 165                        enabled = 0;
 166                        break;
 167                }
 168                pci_read_config_word(child, pos + PCI_EXP_LNKCTL, &reg16);
 169                if (!(reg16 & PCI_EXP_LNKCTL_CLKREQ_EN))
 170                        enabled = 0;
 171        }
 172        link->clkpm_enabled = enabled;
 173        link->clkpm_default = enabled;
 174        link->clkpm_capable = (blacklist) ? 0 : capable;
 175}
 176
 177/*
 178 * pcie_aspm_configure_common_clock: check if the 2 ends of a link
 179 *   could use common clock. If they are, configure them to use the
 180 *   common clock. That will reduce the ASPM state exit latency.
 181 */
 182static void pcie_aspm_configure_common_clock(struct pcie_link_state *link)
 183{
 184        int ppos, cpos, same_clock = 1;
 185        u16 reg16, parent_reg, child_reg[8];
 186        unsigned long start_jiffies;
 187        struct pci_dev *child, *parent = link->pdev;
 188        struct pci_bus *linkbus = parent->subordinate;
 189        /*
 190         * All functions of a slot should have the same Slot Clock
 191         * Configuration, so just check one function
 192         */
 193        child = list_entry(linkbus->devices.next, struct pci_dev, bus_list);
 194        BUG_ON(!pci_is_pcie(child));
 195
 196        /* Check downstream component if bit Slot Clock Configuration is 1 */
 197        cpos = pci_pcie_cap(child);
 198        pci_read_config_word(child, cpos + PCI_EXP_LNKSTA, &reg16);
 199        if (!(reg16 & PCI_EXP_LNKSTA_SLC))
 200                same_clock = 0;
 201
 202        /* Check upstream component if bit Slot Clock Configuration is 1 */
 203        ppos = pci_pcie_cap(parent);
 204        pci_read_config_word(parent, ppos + PCI_EXP_LNKSTA, &reg16);
 205        if (!(reg16 & PCI_EXP_LNKSTA_SLC))
 206                same_clock = 0;
 207
 208        /* Configure downstream component, all functions */
 209        list_for_each_entry(child, &linkbus->devices, bus_list) {
 210                cpos = pci_pcie_cap(child);
 211                pci_read_config_word(child, cpos + PCI_EXP_LNKCTL, &reg16);
 212                child_reg[PCI_FUNC(child->devfn)] = reg16;
 213                if (same_clock)
 214                        reg16 |= PCI_EXP_LNKCTL_CCC;
 215                else
 216                        reg16 &= ~PCI_EXP_LNKCTL_CCC;
 217                pci_write_config_word(child, cpos + PCI_EXP_LNKCTL, reg16);
 218        }
 219
 220        /* Configure upstream component */
 221        pci_read_config_word(parent, ppos + PCI_EXP_LNKCTL, &reg16);
 222        parent_reg = reg16;
 223        if (same_clock)
 224                reg16 |= PCI_EXP_LNKCTL_CCC;
 225        else
 226                reg16 &= ~PCI_EXP_LNKCTL_CCC;
 227        pci_write_config_word(parent, ppos + PCI_EXP_LNKCTL, reg16);
 228
 229        /* Retrain link */
 230        reg16 |= PCI_EXP_LNKCTL_RL;
 231        pci_write_config_word(parent, ppos + PCI_EXP_LNKCTL, reg16);
 232
 233        /* Wait for link training end. Break out after waiting for timeout */
 234        start_jiffies = jiffies;
 235        for (;;) {
 236                pci_read_config_word(parent, ppos + PCI_EXP_LNKSTA, &reg16);
 237                if (!(reg16 & PCI_EXP_LNKSTA_LT))
 238                        break;
 239                if (time_after(jiffies, start_jiffies + LINK_RETRAIN_TIMEOUT))
 240                        break;
 241                msleep(1);
 242        }
 243        if (!(reg16 & PCI_EXP_LNKSTA_LT))
 244                return;
 245
 246        /* Training failed. Restore common clock configurations */
 247        dev_printk(KERN_ERR, &parent->dev,
 248                   "ASPM: Could not configure common clock\n");
 249        list_for_each_entry(child, &linkbus->devices, bus_list) {
 250                cpos = pci_pcie_cap(child);
 251                pci_write_config_word(child, cpos + PCI_EXP_LNKCTL,
 252                                      child_reg[PCI_FUNC(child->devfn)]);
 253        }
 254        pci_write_config_word(parent, ppos + PCI_EXP_LNKCTL, parent_reg);
 255}
 256
 257/* Convert L0s latency encoding to ns */
 258static u32 calc_l0s_latency(u32 encoding)
 259{
 260        if (encoding == 0x7)
 261                return (5 * 1000);      /* > 4us */
 262        return (64 << encoding);
 263}
 264
 265/* Convert L0s acceptable latency encoding to ns */
 266static u32 calc_l0s_acceptable(u32 encoding)
 267{
 268        if (encoding == 0x7)
 269                return -1U;
 270        return (64 << encoding);
 271}
 272
 273/* Convert L1 latency encoding to ns */
 274static u32 calc_l1_latency(u32 encoding)
 275{
 276        if (encoding == 0x7)
 277                return (65 * 1000);     /* > 64us */
 278        return (1000 << encoding);
 279}
 280
 281/* Convert L1 acceptable latency encoding to ns */
 282static u32 calc_l1_acceptable(u32 encoding)
 283{
 284        if (encoding == 0x7)
 285                return -1U;
 286        return (1000 << encoding);
 287}
 288
 289struct aspm_register_info {
 290        u32 support:2;
 291        u32 enabled:2;
 292        u32 latency_encoding_l0s;
 293        u32 latency_encoding_l1;
 294};
 295
 296static void pcie_get_aspm_reg(struct pci_dev *pdev,
 297                              struct aspm_register_info *info)
 298{
 299        int pos;
 300        u16 reg16;
 301        u32 reg32;
 302
 303        pos = pci_pcie_cap(pdev);
 304        pci_read_config_dword(pdev, pos + PCI_EXP_LNKCAP, &reg32);
 305        info->support = (reg32 & PCI_EXP_LNKCAP_ASPMS) >> 10;
 306        info->latency_encoding_l0s = (reg32 & PCI_EXP_LNKCAP_L0SEL) >> 12;
 307        info->latency_encoding_l1  = (reg32 & PCI_EXP_LNKCAP_L1EL) >> 15;
 308        pci_read_config_word(pdev, pos + PCI_EXP_LNKCTL, &reg16);
 309        info->enabled = reg16 & PCI_EXP_LNKCTL_ASPMC;
 310}
 311
 312static void pcie_aspm_check_latency(struct pci_dev *endpoint)
 313{
 314        u32 latency, l1_switch_latency = 0;
 315        struct aspm_latency *acceptable;
 316        struct pcie_link_state *link;
 317
 318        /* Device not in D0 doesn't need latency check */
 319        if ((endpoint->current_state != PCI_D0) &&
 320            (endpoint->current_state != PCI_UNKNOWN))
 321                return;
 322
 323        link = endpoint->bus->self->link_state;
 324        acceptable = &link->acceptable[PCI_FUNC(endpoint->devfn)];
 325
 326        while (link) {
 327                /* Check upstream direction L0s latency */
 328                if ((link->aspm_capable & ASPM_STATE_L0S_UP) &&
 329                    (link->latency_up.l0s > acceptable->l0s))
 330                        link->aspm_capable &= ~ASPM_STATE_L0S_UP;
 331
 332                /* Check downstream direction L0s latency */
 333                if ((link->aspm_capable & ASPM_STATE_L0S_DW) &&
 334                    (link->latency_dw.l0s > acceptable->l0s))
 335                        link->aspm_capable &= ~ASPM_STATE_L0S_DW;
 336                /*
 337                 * Check L1 latency.
 338                 * Every switch on the path to root complex need 1
 339                 * more microsecond for L1. Spec doesn't mention L0s.
 340                 */
 341                latency = max_t(u32, link->latency_up.l1, link->latency_dw.l1);
 342                if ((link->aspm_capable & ASPM_STATE_L1) &&
 343                    (latency + l1_switch_latency > acceptable->l1))
 344                        link->aspm_capable &= ~ASPM_STATE_L1;
 345                l1_switch_latency += 1000;
 346
 347                link = link->parent;
 348        }
 349}
 350
 351static void pcie_aspm_cap_init(struct pcie_link_state *link, int blacklist)
 352{
 353        struct pci_dev *child, *parent = link->pdev;
 354        struct pci_bus *linkbus = parent->subordinate;
 355        struct aspm_register_info upreg, dwreg;
 356
 357        if (blacklist) {
 358                /* Set enabled/disable so that we will disable ASPM later */
 359                link->aspm_enabled = ASPM_STATE_ALL;
 360                link->aspm_disable = ASPM_STATE_ALL;
 361                return;
 362        }
 363
 364        /* Configure common clock before checking latencies */
 365        pcie_aspm_configure_common_clock(link);
 366
 367        /* Get upstream/downstream components' register state */
 368        pcie_get_aspm_reg(parent, &upreg);
 369        child = list_entry(linkbus->devices.next, struct pci_dev, bus_list);
 370        pcie_get_aspm_reg(child, &dwreg);
 371
 372        /*
 373         * Setup L0s state
 374         *
 375         * Note that we must not enable L0s in either direction on a
 376         * given link unless components on both sides of the link each
 377         * support L0s.
 378         */
 379        if (dwreg.support & upreg.support & PCIE_LINK_STATE_L0S)
 380                link->aspm_support |= ASPM_STATE_L0S;
 381        if (dwreg.enabled & PCIE_LINK_STATE_L0S)
 382                link->aspm_enabled |= ASPM_STATE_L0S_UP;
 383        if (upreg.enabled & PCIE_LINK_STATE_L0S)
 384                link->aspm_enabled |= ASPM_STATE_L0S_DW;
 385        link->latency_up.l0s = calc_l0s_latency(upreg.latency_encoding_l0s);
 386        link->latency_dw.l0s = calc_l0s_latency(dwreg.latency_encoding_l0s);
 387
 388        /* Setup L1 state */
 389        if (upreg.support & dwreg.support & PCIE_LINK_STATE_L1)
 390                link->aspm_support |= ASPM_STATE_L1;
 391        if (upreg.enabled & dwreg.enabled & PCIE_LINK_STATE_L1)
 392                link->aspm_enabled |= ASPM_STATE_L1;
 393        link->latency_up.l1 = calc_l1_latency(upreg.latency_encoding_l1);
 394        link->latency_dw.l1 = calc_l1_latency(dwreg.latency_encoding_l1);
 395
 396        /* Save default state */
 397        link->aspm_default = link->aspm_enabled;
 398
 399        /* Setup initial capable state. Will be updated later */
 400        link->aspm_capable = link->aspm_support;
 401        /*
 402         * If the downstream component has pci bridge function, don't
 403         * do ASPM for now.
 404         */
 405        list_for_each_entry(child, &linkbus->devices, bus_list) {
 406                if (child->pcie_type == PCI_EXP_TYPE_PCI_BRIDGE) {
 407                        link->aspm_disable = ASPM_STATE_ALL;
 408                        break;
 409                }
 410        }
 411
 412        /* Get and check endpoint acceptable latencies */
 413        list_for_each_entry(child, &linkbus->devices, bus_list) {
 414                int pos;
 415                u32 reg32, encoding;
 416                struct aspm_latency *acceptable =
 417                        &link->acceptable[PCI_FUNC(child->devfn)];
 418
 419                if (child->pcie_type != PCI_EXP_TYPE_ENDPOINT &&
 420                    child->pcie_type != PCI_EXP_TYPE_LEG_END)
 421                        continue;
 422
 423                pos = pci_pcie_cap(child);
 424                pci_read_config_dword(child, pos + PCI_EXP_DEVCAP, &reg32);
 425                /* Calculate endpoint L0s acceptable latency */
 426                encoding = (reg32 & PCI_EXP_DEVCAP_L0S) >> 6;
 427                acceptable->l0s = calc_l0s_acceptable(encoding);
 428                /* Calculate endpoint L1 acceptable latency */
 429                encoding = (reg32 & PCI_EXP_DEVCAP_L1) >> 9;
 430                acceptable->l1 = calc_l1_acceptable(encoding);
 431
 432                pcie_aspm_check_latency(child);
 433        }
 434}
 435
 436static void pcie_config_aspm_dev(struct pci_dev *pdev, u32 val)
 437{
 438        u16 reg16;
 439        int pos = pci_pcie_cap(pdev);
 440
 441        pci_read_config_word(pdev, pos + PCI_EXP_LNKCTL, &reg16);
 442        reg16 &= ~0x3;
 443        reg16 |= val;
 444        pci_write_config_word(pdev, pos + PCI_EXP_LNKCTL, reg16);
 445}
 446
 447static void pcie_config_aspm_link(struct pcie_link_state *link, u32 state)
 448{
 449        u32 upstream = 0, dwstream = 0;
 450        struct pci_dev *child, *parent = link->pdev;
 451        struct pci_bus *linkbus = parent->subordinate;
 452
 453        /* Nothing to do if the link is already in the requested state */
 454        state &= (link->aspm_capable & ~link->aspm_disable);
 455        if (link->aspm_enabled == state)
 456                return;
 457        /* Convert ASPM state to upstream/downstream ASPM register state */
 458        if (state & ASPM_STATE_L0S_UP)
 459                dwstream |= PCIE_LINK_STATE_L0S;
 460        if (state & ASPM_STATE_L0S_DW)
 461                upstream |= PCIE_LINK_STATE_L0S;
 462        if (state & ASPM_STATE_L1) {
 463                upstream |= PCIE_LINK_STATE_L1;
 464                dwstream |= PCIE_LINK_STATE_L1;
 465        }
 466        /*
 467         * Spec 2.0 suggests all functions should be configured the
 468         * same setting for ASPM. Enabling ASPM L1 should be done in
 469         * upstream component first and then downstream, and vice
 470         * versa for disabling ASPM L1. Spec doesn't mention L0S.
 471         */
 472        if (state & ASPM_STATE_L1)
 473                pcie_config_aspm_dev(parent, upstream);
 474        list_for_each_entry(child, &linkbus->devices, bus_list)
 475                pcie_config_aspm_dev(child, dwstream);
 476        if (!(state & ASPM_STATE_L1))
 477                pcie_config_aspm_dev(parent, upstream);
 478
 479        link->aspm_enabled = state;
 480}
 481
 482static void pcie_config_aspm_path(struct pcie_link_state *link)
 483{
 484        while (link) {
 485                pcie_config_aspm_link(link, policy_to_aspm_state(link));
 486                link = link->parent;
 487        }
 488}
 489
 490static void free_link_state(struct pcie_link_state *link)
 491{
 492        link->pdev->link_state = NULL;
 493        kfree(link);
 494}
 495
 496static int pcie_aspm_sanity_check(struct pci_dev *pdev)
 497{
 498        struct pci_dev *child;
 499        int pos;
 500        u32 reg32;
 501
 502        if (aspm_clear_state)
 503                return -EINVAL;
 504
 505        /*
 506         * Some functions in a slot might not all be PCIe functions,
 507         * very strange. Disable ASPM for the whole slot
 508         */
 509        list_for_each_entry(child, &pdev->subordinate->devices, bus_list) {
 510                pos = pci_pcie_cap(child);
 511                if (!pos)
 512                        return -EINVAL;
 513                /*
 514                 * Disable ASPM for pre-1.1 PCIe device, we follow MS to use
 515                 * RBER bit to determine if a function is 1.1 version device
 516                 */
 517                pci_read_config_dword(child, pos + PCI_EXP_DEVCAP, &reg32);
 518                if (!(reg32 & PCI_EXP_DEVCAP_RBER) && !aspm_force) {
 519                        dev_printk(KERN_INFO, &child->dev, "disabling ASPM"
 520                                " on pre-1.1 PCIe device.  You can enable it"
 521                                " with 'pcie_aspm=force'\n");
 522                        return -EINVAL;
 523                }
 524        }
 525        return 0;
 526}
 527
 528static struct pcie_link_state *alloc_pcie_link_state(struct pci_dev *pdev)
 529{
 530        struct pcie_link_state *link;
 531
 532        link = kzalloc(sizeof(*link), GFP_KERNEL);
 533        if (!link)
 534                return NULL;
 535        INIT_LIST_HEAD(&link->sibling);
 536        INIT_LIST_HEAD(&link->children);
 537        INIT_LIST_HEAD(&link->link);
 538        link->pdev = pdev;
 539        if (pdev->pcie_type == PCI_EXP_TYPE_DOWNSTREAM) {
 540                struct pcie_link_state *parent;
 541                parent = pdev->bus->parent->self->link_state;
 542                if (!parent) {
 543                        kfree(link);
 544                        return NULL;
 545                }
 546                link->parent = parent;
 547                list_add(&link->link, &parent->children);
 548        }
 549        /* Setup a pointer to the root port link */
 550        if (!link->parent)
 551                link->root = link;
 552        else
 553                link->root = link->parent->root;
 554
 555        list_add(&link->sibling, &link_list);
 556        pdev->link_state = link;
 557        return link;
 558}
 559
 560/*
 561 * pcie_aspm_init_link_state: Initiate PCI express link state.
 562 * It is called after the pcie and its children devices are scaned.
 563 * @pdev: the root port or switch downstream port
 564 */
 565void pcie_aspm_init_link_state(struct pci_dev *pdev)
 566{
 567        struct pcie_link_state *link;
 568        int blacklist = !!pcie_aspm_sanity_check(pdev);
 569
 570        if (!pci_is_pcie(pdev) || pdev->link_state)
 571                return;
 572        if (pdev->pcie_type != PCI_EXP_TYPE_ROOT_PORT &&
 573            pdev->pcie_type != PCI_EXP_TYPE_DOWNSTREAM)
 574                return;
 575
 576        if (aspm_disabled && !aspm_clear_state)
 577                return;
 578
 579        /* VIA has a strange chipset, root port is under a bridge */
 580        if (pdev->pcie_type == PCI_EXP_TYPE_ROOT_PORT &&
 581            pdev->bus->self)
 582                return;
 583
 584        down_read(&pci_bus_sem);
 585        if (list_empty(&pdev->subordinate->devices))
 586                goto out;
 587
 588        mutex_lock(&aspm_lock);
 589        link = alloc_pcie_link_state(pdev);
 590        if (!link)
 591                goto unlock;
 592        /*
 593         * Setup initial ASPM state. Note that we need to configure
 594         * upstream links also because capable state of them can be
 595         * update through pcie_aspm_cap_init().
 596         */
 597        pcie_aspm_cap_init(link, blacklist);
 598
 599        /* Setup initial Clock PM state */
 600        pcie_clkpm_cap_init(link, blacklist);
 601
 602        /*
 603         * At this stage drivers haven't had an opportunity to change the
 604         * link policy setting. Enabling ASPM on broken hardware can cripple
 605         * it even before the driver has had a chance to disable ASPM, so
 606         * default to a safe level right now. If we're enabling ASPM beyond
 607         * the BIOS's expectation, we'll do so once pci_enable_device() is
 608         * called.
 609         */
 610        if (aspm_policy != POLICY_POWERSAVE) {
 611                pcie_config_aspm_path(link);
 612                pcie_set_clkpm(link, policy_to_clkpm_state(link));
 613        }
 614
 615unlock:
 616        mutex_unlock(&aspm_lock);
 617out:
 618        up_read(&pci_bus_sem);
 619}
 620
 621/* Recheck latencies and update aspm_capable for links under the root */
 622static void pcie_update_aspm_capable(struct pcie_link_state *root)
 623{
 624        struct pcie_link_state *link;
 625        BUG_ON(root->parent);
 626        list_for_each_entry(link, &link_list, sibling) {
 627                if (link->root != root)
 628                        continue;
 629                link->aspm_capable = link->aspm_support;
 630        }
 631        list_for_each_entry(link, &link_list, sibling) {
 632                struct pci_dev *child;
 633                struct pci_bus *linkbus = link->pdev->subordinate;
 634                if (link->root != root)
 635                        continue;
 636                list_for_each_entry(child, &linkbus->devices, bus_list) {
 637                        if ((child->pcie_type != PCI_EXP_TYPE_ENDPOINT) &&
 638                            (child->pcie_type != PCI_EXP_TYPE_LEG_END))
 639                                continue;
 640                        pcie_aspm_check_latency(child);
 641                }
 642        }
 643}
 644
 645/* @pdev: the endpoint device */
 646void pcie_aspm_exit_link_state(struct pci_dev *pdev)
 647{
 648        struct pci_dev *parent = pdev->bus->self;
 649        struct pcie_link_state *link, *root, *parent_link;
 650
 651        if ((aspm_disabled && !aspm_clear_state) || !pci_is_pcie(pdev) ||
 652            !parent || !parent->link_state)
 653                return;
 654        if ((parent->pcie_type != PCI_EXP_TYPE_ROOT_PORT) &&
 655            (parent->pcie_type != PCI_EXP_TYPE_DOWNSTREAM))
 656                return;
 657
 658        down_read(&pci_bus_sem);
 659        mutex_lock(&aspm_lock);
 660        /*
 661         * All PCIe functions are in one slot, remove one function will remove
 662         * the whole slot, so just wait until we are the last function left.
 663         */
 664        if (!list_is_last(&pdev->bus_list, &parent->subordinate->devices))
 665                goto out;
 666
 667        link = parent->link_state;
 668        root = link->root;
 669        parent_link = link->parent;
 670
 671        /* All functions are removed, so just disable ASPM for the link */
 672        pcie_config_aspm_link(link, 0);
 673        list_del(&link->sibling);
 674        list_del(&link->link);
 675        /* Clock PM is for endpoint device */
 676        free_link_state(link);
 677
 678        /* Recheck latencies and configure upstream links */
 679        if (parent_link) {
 680                pcie_update_aspm_capable(root);
 681                pcie_config_aspm_path(parent_link);
 682        }
 683out:
 684        mutex_unlock(&aspm_lock);
 685        up_read(&pci_bus_sem);
 686}
 687
 688/* @pdev: the root port or switch downstream port */
 689void pcie_aspm_pm_state_change(struct pci_dev *pdev)
 690{
 691        struct pcie_link_state *link = pdev->link_state;
 692
 693        if (aspm_disabled || !pci_is_pcie(pdev) || !link)
 694                return;
 695        if ((pdev->pcie_type != PCI_EXP_TYPE_ROOT_PORT) &&
 696            (pdev->pcie_type != PCI_EXP_TYPE_DOWNSTREAM))
 697                return;
 698        /*
 699         * Devices changed PM state, we should recheck if latency
 700         * meets all functions' requirement
 701         */
 702        down_read(&pci_bus_sem);
 703        mutex_lock(&aspm_lock);
 704        pcie_update_aspm_capable(link->root);
 705        pcie_config_aspm_path(link);
 706        mutex_unlock(&aspm_lock);
 707        up_read(&pci_bus_sem);
 708}
 709
 710/*
 711 * pci_disable_link_state - disable pci device's link state, so the link will
 712 * never enter specific states
 713 */
 714void pci_disable_link_state(struct pci_dev *pdev, int state)
 715{
 716        struct pci_dev *parent = pdev->bus->self;
 717        struct pcie_link_state *link;
 718
 719        if (aspm_disabled || !pci_is_pcie(pdev))
 720                return;
 721        if (pdev->pcie_type == PCI_EXP_TYPE_ROOT_PORT ||
 722            pdev->pcie_type == PCI_EXP_TYPE_DOWNSTREAM)
 723                parent = pdev;
 724        if (!parent || !parent->link_state)
 725                return;
 726
 727        down_read(&pci_bus_sem);
 728        mutex_lock(&aspm_lock);
 729        link = parent->link_state;
 730        if (state & PCIE_LINK_STATE_L0S)
 731                link->aspm_disable |= ASPM_STATE_L0S;
 732        if (state & PCIE_LINK_STATE_L1)
 733                link->aspm_disable |= ASPM_STATE_L1;
 734        pcie_config_aspm_link(link, policy_to_aspm_state(link));
 735
 736        if (state & PCIE_LINK_STATE_CLKPM) {
 737                link->clkpm_capable = 0;
 738                pcie_set_clkpm(link, 0);
 739        }
 740        mutex_unlock(&aspm_lock);
 741        up_read(&pci_bus_sem);
 742}
 743EXPORT_SYMBOL(pci_disable_link_state);
 744
 745static int pcie_aspm_set_policy(const char *val, struct kernel_param *kp)
 746{
 747        int i;
 748        struct pcie_link_state *link;
 749
 750        for (i = 0; i < ARRAY_SIZE(policy_str); i++)
 751                if (!strncmp(val, policy_str[i], strlen(policy_str[i])))
 752                        break;
 753        if (i >= ARRAY_SIZE(policy_str))
 754                return -EINVAL;
 755        if (i == aspm_policy)
 756                return 0;
 757
 758        down_read(&pci_bus_sem);
 759        mutex_lock(&aspm_lock);
 760        aspm_policy = i;
 761        list_for_each_entry(link, &link_list, sibling) {
 762                pcie_config_aspm_link(link, policy_to_aspm_state(link));
 763                pcie_set_clkpm(link, policy_to_clkpm_state(link));
 764        }
 765        mutex_unlock(&aspm_lock);
 766        up_read(&pci_bus_sem);
 767        return 0;
 768}
 769
 770static int pcie_aspm_get_policy(char *buffer, struct kernel_param *kp)
 771{
 772        int i, cnt = 0;
 773        for (i = 0; i < ARRAY_SIZE(policy_str); i++)
 774                if (i == aspm_policy)
 775                        cnt += sprintf(buffer + cnt, "[%s] ", policy_str[i]);
 776                else
 777                        cnt += sprintf(buffer + cnt, "%s ", policy_str[i]);
 778        return cnt;
 779}
 780
 781module_param_call(policy, pcie_aspm_set_policy, pcie_aspm_get_policy,
 782        NULL, 0644);
 783
 784#ifdef CONFIG_PCIEASPM_DEBUG
 785static ssize_t link_state_show(struct device *dev,
 786                struct device_attribute *attr,
 787                char *buf)
 788{
 789        struct pci_dev *pci_device = to_pci_dev(dev);
 790        struct pcie_link_state *link_state = pci_device->link_state;
 791
 792        return sprintf(buf, "%d\n", link_state->aspm_enabled);
 793}
 794
 795static ssize_t link_state_store(struct device *dev,
 796                struct device_attribute *attr,
 797                const char *buf,
 798                size_t n)
 799{
 800        struct pci_dev *pdev = to_pci_dev(dev);
 801        struct pcie_link_state *link, *root = pdev->link_state->root;
 802        u32 val = buf[0] - '0', state = 0;
 803
 804        if (n < 1 || val > 3)
 805                return -EINVAL;
 806
 807        /* Convert requested state to ASPM state */
 808        if (val & PCIE_LINK_STATE_L0S)
 809                state |= ASPM_STATE_L0S;
 810        if (val & PCIE_LINK_STATE_L1)
 811                state |= ASPM_STATE_L1;
 812
 813        down_read(&pci_bus_sem);
 814        mutex_lock(&aspm_lock);
 815        list_for_each_entry(link, &link_list, sibling) {
 816                if (link->root != root)
 817                        continue;
 818                pcie_config_aspm_link(link, state);
 819        }
 820        mutex_unlock(&aspm_lock);
 821        up_read(&pci_bus_sem);
 822        return n;
 823}
 824
 825static ssize_t clk_ctl_show(struct device *dev,
 826                struct device_attribute *attr,
 827                char *buf)
 828{
 829        struct pci_dev *pci_device = to_pci_dev(dev);
 830        struct pcie_link_state *link_state = pci_device->link_state;
 831
 832        return sprintf(buf, "%d\n", link_state->clkpm_enabled);
 833}
 834
 835static ssize_t clk_ctl_store(struct device *dev,
 836                struct device_attribute *attr,
 837                const char *buf,
 838                size_t n)
 839{
 840        struct pci_dev *pdev = to_pci_dev(dev);
 841        int state;
 842
 843        if (n < 1)
 844                return -EINVAL;
 845        state = buf[0]-'0';
 846
 847        down_read(&pci_bus_sem);
 848        mutex_lock(&aspm_lock);
 849        pcie_set_clkpm_nocheck(pdev->link_state, !!state);
 850        mutex_unlock(&aspm_lock);
 851        up_read(&pci_bus_sem);
 852
 853        return n;
 854}
 855
 856static DEVICE_ATTR(link_state, 0644, link_state_show, link_state_store);
 857static DEVICE_ATTR(clk_ctl, 0644, clk_ctl_show, clk_ctl_store);
 858
 859static char power_group[] = "power";
 860void pcie_aspm_create_sysfs_dev_files(struct pci_dev *pdev)
 861{
 862        struct pcie_link_state *link_state = pdev->link_state;
 863
 864        if (!pci_is_pcie(pdev) ||
 865            (pdev->pcie_type != PCI_EXP_TYPE_ROOT_PORT &&
 866             pdev->pcie_type != PCI_EXP_TYPE_DOWNSTREAM) || !link_state)
 867                return;
 868
 869        if (link_state->aspm_support)
 870                sysfs_add_file_to_group(&pdev->dev.kobj,
 871                        &dev_attr_link_state.attr, power_group);
 872        if (link_state->clkpm_capable)
 873                sysfs_add_file_to_group(&pdev->dev.kobj,
 874                        &dev_attr_clk_ctl.attr, power_group);
 875}
 876
 877void pcie_aspm_remove_sysfs_dev_files(struct pci_dev *pdev)
 878{
 879        struct pcie_link_state *link_state = pdev->link_state;
 880
 881        if (!pci_is_pcie(pdev) ||
 882            (pdev->pcie_type != PCI_EXP_TYPE_ROOT_PORT &&
 883             pdev->pcie_type != PCI_EXP_TYPE_DOWNSTREAM) || !link_state)
 884                return;
 885
 886        if (link_state->aspm_support)
 887                sysfs_remove_file_from_group(&pdev->dev.kobj,
 888                        &dev_attr_link_state.attr, power_group);
 889        if (link_state->clkpm_capable)
 890                sysfs_remove_file_from_group(&pdev->dev.kobj,
 891                        &dev_attr_clk_ctl.attr, power_group);
 892}
 893#endif
 894
 895static int __init pcie_aspm_disable(char *str)
 896{
 897        if (!strcmp(str, "off")) {
 898                aspm_disabled = 1;
 899                printk(KERN_INFO "PCIe ASPM is disabled\n");
 900        } else if (!strcmp(str, "force")) {
 901                aspm_force = 1;
 902                printk(KERN_INFO "PCIe ASPM is forcedly enabled\n");
 903        }
 904        return 1;
 905}
 906
 907__setup("pcie_aspm=", pcie_aspm_disable);
 908
 909void pcie_clear_aspm(void)
 910{
 911        if (!aspm_force)
 912                aspm_clear_state = 1;
 913}
 914
 915void pcie_no_aspm(void)
 916{
 917        if (!aspm_force)
 918                aspm_disabled = 1;
 919}
 920
 921/**
 922 * pcie_aspm_enabled - is PCIe ASPM enabled?
 923 *
 924 * Returns true if ASPM has not been disabled by the command-line option
 925 * pcie_aspm=off.
 926 **/
 927int pcie_aspm_enabled(void)
 928{
 929       return !aspm_disabled;
 930}
 931EXPORT_SYMBOL(pcie_aspm_enabled);
 932
 933