linux/arch/powerpc/platforms/powernv/setup.c
<<
>>
Prefs
   1/*
   2 * PowerNV setup code.
   3 *
   4 * Copyright 2011 IBM Corp.
   5 *
   6 * This program is free software; you can redistribute it and/or
   7 * modify it under the terms of the GNU General Public License
   8 * as published by the Free Software Foundation; either version
   9 * 2 of the License, or (at your option) any later version.
  10 */
  11
  12#undef DEBUG
  13
  14#include <linux/cpu.h>
  15#include <linux/errno.h>
  16#include <linux/sched.h>
  17#include <linux/kernel.h>
  18#include <linux/tty.h>
  19#include <linux/reboot.h>
  20#include <linux/init.h>
  21#include <linux/console.h>
  22#include <linux/delay.h>
  23#include <linux/irq.h>
  24#include <linux/seq_file.h>
  25#include <linux/of.h>
  26#include <linux/of_fdt.h>
  27#include <linux/interrupt.h>
  28#include <linux/bug.h>
  29#include <linux/pci.h>
  30#include <linux/cpufreq.h>
  31
  32#include <asm/machdep.h>
  33#include <asm/firmware.h>
  34#include <asm/xics.h>
  35#include <asm/opal.h>
  36#include <asm/kexec.h>
  37#include <asm/smp.h>
  38
  39#include "powernv.h"
  40
  41static void __init pnv_setup_arch(void)
  42{
  43        set_arch_panic_timeout(10, ARCH_PANIC_TIMEOUT);
  44
  45        /* Initialize SMP */
  46        pnv_smp_init();
  47
  48        /* Setup PCI */
  49        pnv_pci_init();
  50
  51        /* Setup RTC and NVRAM callbacks */
  52        if (firmware_has_feature(FW_FEATURE_OPAL))
  53                opal_nvram_init();
  54
  55        /* Enable NAP mode */
  56        powersave_nap = 1;
  57
  58        /* XXX PMCS */
  59}
  60
  61static void __init pnv_init_early(void)
  62{
  63        /*
  64         * Initialize the LPC bus now so that legacy serial
  65         * ports can be found on it
  66         */
  67        opal_lpc_init();
  68
  69#ifdef CONFIG_HVC_OPAL
  70        if (firmware_has_feature(FW_FEATURE_OPAL))
  71                hvc_opal_init_early();
  72        else
  73#endif
  74                add_preferred_console("hvc", 0, NULL);
  75}
  76
  77static void __init pnv_init_IRQ(void)
  78{
  79        xics_init();
  80
  81        WARN_ON(!ppc_md.get_irq);
  82}
  83
  84static void pnv_show_cpuinfo(struct seq_file *m)
  85{
  86        struct device_node *root;
  87        const char *model = "";
  88
  89        root = of_find_node_by_path("/");
  90        if (root)
  91                model = of_get_property(root, "model", NULL);
  92        seq_printf(m, "machine\t\t: PowerNV %s\n", model);
  93        if (firmware_has_feature(FW_FEATURE_OPALv3))
  94                seq_printf(m, "firmware\t: OPAL v3\n");
  95        else if (firmware_has_feature(FW_FEATURE_OPALv2))
  96                seq_printf(m, "firmware\t: OPAL v2\n");
  97        else if (firmware_has_feature(FW_FEATURE_OPAL))
  98                seq_printf(m, "firmware\t: OPAL v1\n");
  99        else
 100                seq_printf(m, "firmware\t: BML\n");
 101        of_node_put(root);
 102}
 103
 104static void pnv_prepare_going_down(void)
 105{
 106        /*
 107         * Disable all notifiers from OPAL, we can't
 108         * service interrupts anymore anyway
 109         */
 110        opal_event_shutdown();
 111
 112        /* Soft disable interrupts */
 113        local_irq_disable();
 114
 115        /*
 116         * Return secondary CPUs to firwmare if a flash update
 117         * is pending otherwise we will get all sort of error
 118         * messages about CPU being stuck etc.. This will also
 119         * have the side effect of hard disabling interrupts so
 120         * past this point, the kernel is effectively dead.
 121         */
 122        opal_flash_term_callback();
 123}
 124
 125static void  __noreturn pnv_restart(char *cmd)
 126{
 127        long rc = OPAL_BUSY;
 128
 129        pnv_prepare_going_down();
 130
 131        while (rc == OPAL_BUSY || rc == OPAL_BUSY_EVENT) {
 132                rc = opal_cec_reboot();
 133                if (rc == OPAL_BUSY_EVENT)
 134                        opal_poll_events(NULL);
 135                else
 136                        mdelay(10);
 137        }
 138        for (;;)
 139                opal_poll_events(NULL);
 140}
 141
 142static void __noreturn pnv_power_off(void)
 143{
 144        long rc = OPAL_BUSY;
 145
 146        pnv_prepare_going_down();
 147
 148        while (rc == OPAL_BUSY || rc == OPAL_BUSY_EVENT) {
 149                rc = opal_cec_power_down(0);
 150                if (rc == OPAL_BUSY_EVENT)
 151                        opal_poll_events(NULL);
 152                else
 153                        mdelay(10);
 154        }
 155        for (;;)
 156                opal_poll_events(NULL);
 157}
 158
 159static void __noreturn pnv_halt(void)
 160{
 161        pnv_power_off();
 162}
 163
 164static void pnv_progress(char *s, unsigned short hex)
 165{
 166}
 167
 168static void pnv_shutdown(void)
 169{
 170        /* Let the PCI code clear up IODA tables */
 171        pnv_pci_shutdown();
 172
 173        /*
 174         * Stop OPAL activity: Unregister all OPAL interrupts so they
 175         * don't fire up while we kexec and make sure all potentially
 176         * DMA'ing ops are complete (such as dump retrieval).
 177         */
 178        opal_shutdown();
 179}
 180
 181#ifdef CONFIG_KEXEC
 182static void pnv_kexec_wait_secondaries_down(void)
 183{
 184        int my_cpu, i, notified = -1;
 185
 186        my_cpu = get_cpu();
 187
 188        for_each_online_cpu(i) {
 189                uint8_t status;
 190                int64_t rc;
 191
 192                if (i == my_cpu)
 193                        continue;
 194
 195                for (;;) {
 196                        rc = opal_query_cpu_status(get_hard_smp_processor_id(i),
 197                                                   &status);
 198                        if (rc != OPAL_SUCCESS || status != OPAL_THREAD_STARTED)
 199                                break;
 200                        barrier();
 201                        if (i != notified) {
 202                                printk(KERN_INFO "kexec: waiting for cpu %d "
 203                                       "(physical %d) to enter OPAL\n",
 204                                       i, paca[i].hw_cpu_id);
 205                                notified = i;
 206                        }
 207                }
 208        }
 209}
 210
 211static void pnv_kexec_cpu_down(int crash_shutdown, int secondary)
 212{
 213        xics_kexec_teardown_cpu(secondary);
 214
 215        /* On OPAL v3, we return all CPUs to firmware */
 216
 217        if (!firmware_has_feature(FW_FEATURE_OPALv3))
 218                return;
 219
 220        if (secondary) {
 221                /* Return secondary CPUs to firmware on OPAL v3 */
 222                mb();
 223                get_paca()->kexec_state = KEXEC_STATE_REAL_MODE;
 224                mb();
 225
 226                /* Return the CPU to OPAL */
 227                opal_return_cpu();
 228        } else if (crash_shutdown) {
 229                /*
 230                 * On crash, we don't wait for secondaries to go
 231                 * down as they might be unreachable or hung, so
 232                 * instead we just wait a bit and move on.
 233                 */
 234                mdelay(1);
 235        } else {
 236                /* Primary waits for the secondaries to have reached OPAL */
 237                pnv_kexec_wait_secondaries_down();
 238
 239                /*
 240                 * We might be running as little-endian - now that interrupts
 241                 * are disabled, reset the HILE bit to big-endian so we don't
 242                 * take interrupts in the wrong endian later
 243                 */
 244                opal_reinit_cpus(OPAL_REINIT_CPUS_HILE_BE);
 245        }
 246}
 247#endif /* CONFIG_KEXEC */
 248
 249#ifdef CONFIG_MEMORY_HOTPLUG_SPARSE
 250static unsigned long pnv_memory_block_size(void)
 251{
 252        return 256UL * 1024 * 1024;
 253}
 254#endif
 255
 256static void __init pnv_setup_machdep_opal(void)
 257{
 258        ppc_md.get_boot_time = opal_get_boot_time;
 259        ppc_md.restart = pnv_restart;
 260        pm_power_off = pnv_power_off;
 261        ppc_md.halt = pnv_halt;
 262        ppc_md.machine_check_exception = opal_machine_check;
 263        ppc_md.mce_check_early_recovery = opal_mce_check_early_recovery;
 264        ppc_md.hmi_exception_early = opal_hmi_exception_early;
 265        ppc_md.handle_hmi_exception = opal_handle_hmi_exception;
 266}
 267
 268static int __init pnv_probe(void)
 269{
 270        unsigned long root = of_get_flat_dt_root();
 271
 272        if (!of_flat_dt_is_compatible(root, "ibm,powernv"))
 273                return 0;
 274
 275        hpte_init_native();
 276
 277        if (firmware_has_feature(FW_FEATURE_OPAL))
 278                pnv_setup_machdep_opal();
 279
 280        pr_debug("PowerNV detected !\n");
 281
 282        return 1;
 283}
 284
 285/*
 286 * Returns the cpu frequency for 'cpu' in Hz. This is used by
 287 * /proc/cpuinfo
 288 */
 289static unsigned long pnv_get_proc_freq(unsigned int cpu)
 290{
 291        unsigned long ret_freq;
 292
 293        ret_freq = cpufreq_quick_get(cpu) * 1000ul;
 294
 295        /*
 296         * If the backend cpufreq driver does not exist,
 297         * then fallback to old way of reporting the clockrate.
 298         */
 299        if (!ret_freq)
 300                ret_freq = ppc_proc_freq;
 301        return ret_freq;
 302}
 303
 304define_machine(powernv) {
 305        .name                   = "PowerNV",
 306        .probe                  = pnv_probe,
 307        .init_early             = pnv_init_early,
 308        .setup_arch             = pnv_setup_arch,
 309        .init_IRQ               = pnv_init_IRQ,
 310        .show_cpuinfo           = pnv_show_cpuinfo,
 311        .get_proc_freq          = pnv_get_proc_freq,
 312        .progress               = pnv_progress,
 313        .machine_shutdown       = pnv_shutdown,
 314        .power_save             = power7_idle,
 315        .calibrate_decr         = generic_calibrate_decr,
 316#ifdef CONFIG_KEXEC
 317        .kexec_cpu_down         = pnv_kexec_cpu_down,
 318#endif
 319#ifdef CONFIG_MEMORY_HOTPLUG_SPARSE
 320        .memory_block_size      = pnv_memory_block_size,
 321#endif
 322};
 323