linux/arch/powerpc/kernel/head_64.S
<<
>>
Prefs
   1/* SPDX-License-Identifier: GPL-2.0-or-later */
   2/*
   3 *  PowerPC version
   4 *    Copyright (C) 1995-1996 Gary Thomas (gdt@linuxppc.org)
   5 *
   6 *  Rewritten by Cort Dougan (cort@cs.nmt.edu) for PReP
   7 *    Copyright (C) 1996 Cort Dougan <cort@cs.nmt.edu>
   8 *  Adapted for Power Macintosh by Paul Mackerras.
   9 *  Low-level exception handlers and MMU support
  10 *  rewritten by Paul Mackerras.
  11 *    Copyright (C) 1996 Paul Mackerras.
  12 *
  13 *  Adapted for 64bit PowerPC by Dave Engebretsen, Peter Bergner, and
  14 *    Mike Corrigan {engebret|bergner|mikejc}@us.ibm.com
  15 *
  16 *  This file contains the entry point for the 64-bit kernel along
  17 *  with some early initialization code common to all 64-bit powerpc
  18 *  variants.
  19 */
  20
  21#include <linux/threads.h>
  22#include <linux/init.h>
  23#include <asm/reg.h>
  24#include <asm/page.h>
  25#include <asm/mmu.h>
  26#include <asm/ppc_asm.h>
  27#include <asm/head-64.h>
  28#include <asm/asm-offsets.h>
  29#include <asm/bug.h>
  30#include <asm/cputable.h>
  31#include <asm/setup.h>
  32#include <asm/hvcall.h>
  33#include <asm/thread_info.h>
  34#include <asm/firmware.h>
  35#include <asm/page_64.h>
  36#include <asm/irqflags.h>
  37#include <asm/kvm_book3s_asm.h>
  38#include <asm/ptrace.h>
  39#include <asm/hw_irq.h>
  40#include <asm/cputhreads.h>
  41#include <asm/ppc-opcode.h>
  42#include <asm/export.h>
  43#include <asm/feature-fixups.h>
  44
  45/* The physical memory is laid out such that the secondary processor
  46 * spin code sits at 0x0000...0x00ff. On server, the vectors follow
  47 * using the layout described in exceptions-64s.S
  48 */
  49
  50/*
  51 * Entering into this code we make the following assumptions:
  52 *
  53 *  For pSeries or server processors:
  54 *   1. The MMU is off & open firmware is running in real mode.
  55 *   2. The primary CPU enters at __start.
  56 *   3. If the RTAS supports "query-cpu-stopped-state", then secondary
  57 *      CPUs will enter as directed by "start-cpu" RTAS call, which is
  58 *      generic_secondary_smp_init, with PIR in r3.
  59 *   4. Else the secondary CPUs will enter at secondary_hold (0x60) as
  60 *      directed by the "start-cpu" RTS call, with PIR in r3.
  61 * -or- For OPAL entry:
  62 *   1. The MMU is off, processor in HV mode.
  63 *   2. The primary CPU enters at 0 with device-tree in r3, OPAL base
  64 *      in r8, and entry in r9 for debugging purposes.
  65 *   3. Secondary CPUs enter as directed by OPAL_START_CPU call, which
  66 *      is at generic_secondary_smp_init, with PIR in r3.
  67 *
  68 *  For Book3E processors:
  69 *   1. The MMU is on running in AS0 in a state defined in ePAPR
  70 *   2. The kernel is entered at __start
  71 */
  72
  73OPEN_FIXED_SECTION(first_256B, 0x0, 0x100)
  74USE_FIXED_SECTION(first_256B)
  75        /*
  76         * Offsets are relative from the start of fixed section, and
  77         * first_256B starts at 0. Offsets are a bit easier to use here
  78         * than the fixed section entry macros.
  79         */
  80        . = 0x0
  81_GLOBAL(__start)
  82        /* NOP this out unconditionally */
  83BEGIN_FTR_SECTION
  84        FIXUP_ENDIAN
  85        b       __start_initialization_multiplatform
  86END_FTR_SECTION(0, 1)
  87
  88        /* Catch branch to 0 in real mode */
  89        trap
  90
  91        /* Secondary processors spin on this value until it becomes non-zero.
  92         * When non-zero, it contains the real address of the function the cpu
  93         * should jump to.
  94         */
  95        .balign 8
  96        .globl  __secondary_hold_spinloop
  97__secondary_hold_spinloop:
  98        .8byte  0x0
  99
 100        /* Secondary processors write this value with their cpu # */
 101        /* after they enter the spin loop immediately below.      */
 102        .globl  __secondary_hold_acknowledge
 103__secondary_hold_acknowledge:
 104        .8byte  0x0
 105
 106#ifdef CONFIG_RELOCATABLE
 107        /* This flag is set to 1 by a loader if the kernel should run
 108         * at the loaded address instead of the linked address.  This
 109         * is used by kexec-tools to keep the the kdump kernel in the
 110         * crash_kernel region.  The loader is responsible for
 111         * observing the alignment requirement.
 112         */
 113
 114#ifdef CONFIG_RELOCATABLE_TEST
 115#define RUN_AT_LOAD_DEFAULT 1           /* Test relocation, do not copy to 0 */
 116#else
 117#define RUN_AT_LOAD_DEFAULT 0x72756e30  /* "run0" -- relocate to 0 by default */
 118#endif
 119
 120        /* Do not move this variable as kexec-tools knows about it. */
 121        . = 0x5c
 122        .globl  __run_at_load
 123__run_at_load:
 124DEFINE_FIXED_SYMBOL(__run_at_load)
 125        .long   RUN_AT_LOAD_DEFAULT
 126#endif
 127
 128        . = 0x60
 129/*
 130 * The following code is used to hold secondary processors
 131 * in a spin loop after they have entered the kernel, but
 132 * before the bulk of the kernel has been relocated.  This code
 133 * is relocated to physical address 0x60 before prom_init is run.
 134 * All of it must fit below the first exception vector at 0x100.
 135 * Use .globl here not _GLOBAL because we want __secondary_hold
 136 * to be the actual text address, not a descriptor.
 137 */
 138        .globl  __secondary_hold
 139__secondary_hold:
 140        FIXUP_ENDIAN
 141#ifndef CONFIG_PPC_BOOK3E
 142        mfmsr   r24
 143        ori     r24,r24,MSR_RI
 144        mtmsrd  r24                     /* RI on */
 145#endif
 146        /* Grab our physical cpu number */
 147        mr      r24,r3
 148        /* stash r4 for book3e */
 149        mr      r25,r4
 150
 151        /* Tell the master cpu we're here */
 152        /* Relocation is off & we are located at an address less */
 153        /* than 0x100, so only need to grab low order offset.    */
 154        std     r24,(ABS_ADDR(__secondary_hold_acknowledge))(0)
 155        sync
 156
 157        li      r26,0
 158#ifdef CONFIG_PPC_BOOK3E
 159        tovirt(r26,r26)
 160#endif
 161        /* All secondary cpus wait here until told to start. */
 162100:    ld      r12,(ABS_ADDR(__secondary_hold_spinloop))(r26)
 163        cmpdi   0,r12,0
 164        beq     100b
 165
 166#if defined(CONFIG_SMP) || defined(CONFIG_KEXEC_CORE)
 167#ifdef CONFIG_PPC_BOOK3E
 168        tovirt(r12,r12)
 169#endif
 170        mtctr   r12
 171        mr      r3,r24
 172        /*
 173         * it may be the case that other platforms have r4 right to
 174         * begin with, this gives us some safety in case it is not
 175         */
 176#ifdef CONFIG_PPC_BOOK3E
 177        mr      r4,r25
 178#else
 179        li      r4,0
 180#endif
 181        /* Make sure that patched code is visible */
 182        isync
 183        bctr
 184#else
 1850:      trap
 186        EMIT_BUG_ENTRY 0b, __FILE__, __LINE__, 0
 187#endif
 188CLOSE_FIXED_SECTION(first_256B)
 189
 190/* This value is used to mark exception frames on the stack. */
 191        .section ".toc","aw"
 192exception_marker:
 193        .tc     ID_72656773_68657265[TC],0x7265677368657265
 194        .previous
 195
 196/*
 197 * On server, we include the exception vectors code here as it
 198 * relies on absolute addressing which is only possible within
 199 * this compilation unit
 200 */
 201#ifdef CONFIG_PPC_BOOK3S
 202#include "exceptions-64s.S"
 203#else
 204OPEN_TEXT_SECTION(0x100)
 205#endif
 206
 207USE_TEXT_SECTION()
 208
 209#ifdef CONFIG_PPC_BOOK3E
 210/*
 211 * The booting_thread_hwid holds the thread id we want to boot in cpu
 212 * hotplug case. It is set by cpu hotplug code, and is invalid by default.
 213 * The thread id is the same as the initial value of SPRN_PIR[THREAD_ID]
 214 * bit field.
 215 */
 216        .globl  booting_thread_hwid
 217booting_thread_hwid:
 218        .long  INVALID_THREAD_HWID
 219        .align 3
 220/*
 221 * start a thread in the same core
 222 * input parameters:
 223 * r3 = the thread physical id
 224 * r4 = the entry point where thread starts
 225 */
 226_GLOBAL(book3e_start_thread)
 227        LOAD_REG_IMMEDIATE(r5, MSR_KERNEL)
 228        cmpwi   r3, 0
 229        beq     10f
 230        cmpwi   r3, 1
 231        beq     11f
 232        /* If the thread id is invalid, just exit. */
 233        b       13f
 23410:
 235        MTTMR(TMRN_IMSR0, 5)
 236        MTTMR(TMRN_INIA0, 4)
 237        b       12f
 23811:
 239        MTTMR(TMRN_IMSR1, 5)
 240        MTTMR(TMRN_INIA1, 4)
 24112:
 242        isync
 243        li      r6, 1
 244        sld     r6, r6, r3
 245        mtspr   SPRN_TENS, r6
 24613:
 247        blr
 248
 249/*
 250 * stop a thread in the same core
 251 * input parameter:
 252 * r3 = the thread physical id
 253 */
 254_GLOBAL(book3e_stop_thread)
 255        cmpwi   r3, 0
 256        beq     10f
 257        cmpwi   r3, 1
 258        beq     10f
 259        /* If the thread id is invalid, just exit. */
 260        b       13f
 26110:
 262        li      r4, 1
 263        sld     r4, r4, r3
 264        mtspr   SPRN_TENC, r4
 26513:
 266        blr
 267
 268_GLOBAL(fsl_secondary_thread_init)
 269        mfspr   r4,SPRN_BUCSR
 270
 271        /* Enable branch prediction */
 272        lis     r3,BUCSR_INIT@h
 273        ori     r3,r3,BUCSR_INIT@l
 274        mtspr   SPRN_BUCSR,r3
 275        isync
 276
 277        /*
 278         * Fix PIR to match the linear numbering in the device tree.
 279         *
 280         * On e6500, the reset value of PIR uses the low three bits for
 281         * the thread within a core, and the upper bits for the core
 282         * number.  There are two threads per core, so shift everything
 283         * but the low bit right by two bits so that the cpu numbering is
 284         * continuous.
 285         *
 286         * If the old value of BUCSR is non-zero, this thread has run
 287         * before.  Thus, we assume we are coming from kexec or a similar
 288         * scenario, and PIR is already set to the correct value.  This
 289         * is a bit of a hack, but there are limited opportunities for
 290         * getting information into the thread and the alternatives
 291         * seemed like they'd be overkill.  We can't tell just by looking
 292         * at the old PIR value which state it's in, since the same value
 293         * could be valid for one thread out of reset and for a different
 294         * thread in Linux.
 295         */
 296
 297        mfspr   r3, SPRN_PIR
 298        cmpwi   r4,0
 299        bne     1f
 300        rlwimi  r3, r3, 30, 2, 30
 301        mtspr   SPRN_PIR, r3
 3021:
 303#endif
 304
 305_GLOBAL(generic_secondary_thread_init)
 306        mr      r24,r3
 307
 308        /* turn on 64-bit mode */
 309        bl      enable_64b_mode
 310
 311        /* get a valid TOC pointer, wherever we're mapped at */
 312        bl      relative_toc
 313        tovirt(r2,r2)
 314
 315#ifdef CONFIG_PPC_BOOK3E
 316        /* Book3E initialization */
 317        mr      r3,r24
 318        bl      book3e_secondary_thread_init
 319#endif
 320        b       generic_secondary_common_init
 321
 322/*
 323 * On pSeries and most other platforms, secondary processors spin
 324 * in the following code.
 325 * At entry, r3 = this processor's number (physical cpu id)
 326 *
 327 * On Book3E, r4 = 1 to indicate that the initial TLB entry for
 328 * this core already exists (setup via some other mechanism such
 329 * as SCOM before entry).
 330 */
 331_GLOBAL(generic_secondary_smp_init)
 332        FIXUP_ENDIAN
 333        mr      r24,r3
 334        mr      r25,r4
 335
 336        /* turn on 64-bit mode */
 337        bl      enable_64b_mode
 338
 339        /* get a valid TOC pointer, wherever we're mapped at */
 340        bl      relative_toc
 341        tovirt(r2,r2)
 342
 343#ifdef CONFIG_PPC_BOOK3E
 344        /* Book3E initialization */
 345        mr      r3,r24
 346        mr      r4,r25
 347        bl      book3e_secondary_core_init
 348
 349/*
 350 * After common core init has finished, check if the current thread is the
 351 * one we wanted to boot. If not, start the specified thread and stop the
 352 * current thread.
 353 */
 354        LOAD_REG_ADDR(r4, booting_thread_hwid)
 355        lwz     r3, 0(r4)
 356        li      r5, INVALID_THREAD_HWID
 357        cmpw    r3, r5
 358        beq     20f
 359
 360        /*
 361         * The value of booting_thread_hwid has been stored in r3,
 362         * so make it invalid.
 363         */
 364        stw     r5, 0(r4)
 365
 366        /*
 367         * Get the current thread id and check if it is the one we wanted.
 368         * If not, start the one specified in booting_thread_hwid and stop
 369         * the current thread.
 370         */
 371        mfspr   r8, SPRN_TIR
 372        cmpw    r3, r8
 373        beq     20f
 374
 375        /* start the specified thread */
 376        LOAD_REG_ADDR(r5, fsl_secondary_thread_init)
 377        ld      r4, 0(r5)
 378        bl      book3e_start_thread
 379
 380        /* stop the current thread */
 381        mr      r3, r8
 382        bl      book3e_stop_thread
 38310:
 384        b       10b
 38520:
 386#endif
 387
 388generic_secondary_common_init:
 389        /* Set up a paca value for this processor. Since we have the
 390         * physical cpu id in r24, we need to search the pacas to find
 391         * which logical id maps to our physical one.
 392         */
 393#ifndef CONFIG_SMP
 394        b       kexec_wait              /* wait for next kernel if !SMP  */
 395#else
 396        LOAD_REG_ADDR(r8, paca_ptrs)    /* Load paca_ptrs pointe         */
 397        ld      r8,0(r8)                /* Get base vaddr of array       */
 398        LOAD_REG_ADDR(r7, nr_cpu_ids)   /* Load nr_cpu_ids address       */
 399        lwz     r7,0(r7)                /* also the max paca allocated   */
 400        li      r5,0                    /* logical cpu id                */
 4011:
 402        sldi    r9,r5,3                 /* get paca_ptrs[] index from cpu id */
 403        ldx     r13,r9,r8               /* r13 = paca_ptrs[cpu id]       */
 404        lhz     r6,PACAHWCPUID(r13)     /* Load HW procid from paca      */
 405        cmpw    r6,r24                  /* Compare to our id             */
 406        beq     2f
 407        addi    r5,r5,1
 408        cmpw    r5,r7                   /* Check if more pacas exist     */
 409        blt     1b
 410
 411        mr      r3,r24                  /* not found, copy phys to r3    */
 412        b       kexec_wait              /* next kernel might do better   */
 413
 4142:      SET_PACA(r13)
 415#ifdef CONFIG_PPC_BOOK3E
 416        addi    r12,r13,PACA_EXTLB      /* and TLB exc frame in another  */
 417        mtspr   SPRN_SPRG_TLB_EXFRAME,r12
 418#endif
 419
 420        /* From now on, r24 is expected to be logical cpuid */
 421        mr      r24,r5
 422
 423        /* See if we need to call a cpu state restore handler */
 424        LOAD_REG_ADDR(r23, cur_cpu_spec)
 425        ld      r23,0(r23)
 426        ld      r12,CPU_SPEC_RESTORE(r23)
 427        cmpdi   0,r12,0
 428        beq     3f
 429#ifdef PPC64_ELF_ABI_v1
 430        ld      r12,0(r12)
 431#endif
 432        mtctr   r12
 433        bctrl
 434
 4353:      LOAD_REG_ADDR(r3, spinning_secondaries) /* Decrement spinning_secondaries */
 436        lwarx   r4,0,r3
 437        subi    r4,r4,1
 438        stwcx.  r4,0,r3
 439        bne     3b
 440        isync
 441
 4424:      HMT_LOW
 443        lbz     r23,PACAPROCSTART(r13)  /* Test if this processor should */
 444                                        /* start.                        */
 445        cmpwi   0,r23,0
 446        beq     4b                      /* Loop until told to go         */
 447
 448        sync                            /* order paca.run and cur_cpu_spec */
 449        isync                           /* In case code patching happened */
 450
 451        /* Create a temp kernel stack for use before relocation is on.  */
 452        ld      r1,PACAEMERGSP(r13)
 453        subi    r1,r1,STACK_FRAME_OVERHEAD
 454
 455        b       __secondary_start
 456#endif /* SMP */
 457
 458/*
 459 * Turn the MMU off.
 460 * Assumes we're mapped EA == RA if the MMU is on.
 461 */
 462#ifdef CONFIG_PPC_BOOK3S
 463__mmu_off:
 464        mfmsr   r3
 465        andi.   r0,r3,MSR_IR|MSR_DR
 466        beqlr
 467        mflr    r4
 468        andc    r3,r3,r0
 469        mtspr   SPRN_SRR0,r4
 470        mtspr   SPRN_SRR1,r3
 471        sync
 472        rfid
 473        b       .       /* prevent speculative execution */
 474#endif
 475
 476
 477/*
 478 * Here is our main kernel entry point. We support currently 2 kind of entries
 479 * depending on the value of r5.
 480 *
 481 *   r5 != NULL -> OF entry, we go to prom_init, "legacy" parameter content
 482 *                 in r3...r7
 483 *   
 484 *   r5 == NULL -> kexec style entry. r3 is a physical pointer to the
 485 *                 DT block, r4 is a physical pointer to the kernel itself
 486 *
 487 */
 488__start_initialization_multiplatform:
 489        /* Make sure we are running in 64 bits mode */
 490        bl      enable_64b_mode
 491
 492        /* Get TOC pointer (current runtime address) */
 493        bl      relative_toc
 494
 495        /* find out where we are now */
 496        bcl     20,31,$+4
 4970:      mflr    r26                     /* r26 = runtime addr here */
 498        addis   r26,r26,(_stext - 0b)@ha
 499        addi    r26,r26,(_stext - 0b)@l /* current runtime base addr */
 500
 501        /*
 502         * Are we booted from a PROM Of-type client-interface ?
 503         */
 504        cmpldi  cr0,r5,0
 505        beq     1f
 506        b       __boot_from_prom                /* yes -> prom */
 5071:
 508        /* Save parameters */
 509        mr      r31,r3
 510        mr      r30,r4
 511#ifdef CONFIG_PPC_EARLY_DEBUG_OPAL
 512        /* Save OPAL entry */
 513        mr      r28,r8
 514        mr      r29,r9
 515#endif
 516
 517#ifdef CONFIG_PPC_BOOK3E
 518        bl      start_initialization_book3e
 519        b       __after_prom_start
 520#else
 521        /* Setup some critical 970 SPRs before switching MMU off */
 522        mfspr   r0,SPRN_PVR
 523        srwi    r0,r0,16
 524        cmpwi   r0,0x39         /* 970 */
 525        beq     1f
 526        cmpwi   r0,0x3c         /* 970FX */
 527        beq     1f
 528        cmpwi   r0,0x44         /* 970MP */
 529        beq     1f
 530        cmpwi   r0,0x45         /* 970GX */
 531        bne     2f
 5321:      bl      __cpu_preinit_ppc970
 5332:
 534
 535        /* Switch off MMU if not already off */
 536        bl      __mmu_off
 537        b       __after_prom_start
 538#endif /* CONFIG_PPC_BOOK3E */
 539
 540__boot_from_prom:
 541#ifdef CONFIG_PPC_OF_BOOT_TRAMPOLINE
 542        /* Save parameters */
 543        mr      r31,r3
 544        mr      r30,r4
 545        mr      r29,r5
 546        mr      r28,r6
 547        mr      r27,r7
 548
 549        /*
 550         * Align the stack to 16-byte boundary
 551         * Depending on the size and layout of the ELF sections in the initial
 552         * boot binary, the stack pointer may be unaligned on PowerMac
 553         */
 554        rldicr  r1,r1,0,59
 555
 556#ifdef CONFIG_RELOCATABLE
 557        /* Relocate code for where we are now */
 558        mr      r3,r26
 559        bl      relocate
 560#endif
 561
 562        /* Restore parameters */
 563        mr      r3,r31
 564        mr      r4,r30
 565        mr      r5,r29
 566        mr      r6,r28
 567        mr      r7,r27
 568
 569        /* Do all of the interaction with OF client interface */
 570        mr      r8,r26
 571        bl      prom_init
 572#endif /* #CONFIG_PPC_OF_BOOT_TRAMPOLINE */
 573
 574        /* We never return. We also hit that trap if trying to boot
 575         * from OF while CONFIG_PPC_OF_BOOT_TRAMPOLINE isn't selected */
 576        trap
 577
 578__after_prom_start:
 579#ifdef CONFIG_RELOCATABLE
 580        /* process relocations for the final address of the kernel */
 581        lis     r25,PAGE_OFFSET@highest /* compute virtual base of kernel */
 582        sldi    r25,r25,32
 583#if defined(CONFIG_PPC_BOOK3E)
 584        tovirt(r26,r26)         /* on booke, we already run at PAGE_OFFSET */
 585#endif
 586        lwz     r7,(FIXED_SYMBOL_ABS_ADDR(__run_at_load))(r26)
 587#if defined(CONFIG_PPC_BOOK3E)
 588        tophys(r26,r26)
 589#endif
 590        cmplwi  cr0,r7,1        /* flagged to stay where we are ? */
 591        bne     1f
 592        add     r25,r25,r26
 5931:      mr      r3,r25
 594        bl      relocate
 595#if defined(CONFIG_PPC_BOOK3E)
 596        /* IVPR needs to be set after relocation. */
 597        bl      init_core_book3e
 598#endif
 599#endif
 600
 601/*
 602 * We need to run with _stext at physical address PHYSICAL_START.
 603 * This will leave some code in the first 256B of
 604 * real memory, which are reserved for software use.
 605 *
 606 * Note: This process overwrites the OF exception vectors.
 607 */
 608        li      r3,0                    /* target addr */
 609#ifdef CONFIG_PPC_BOOK3E
 610        tovirt(r3,r3)           /* on booke, we already run at PAGE_OFFSET */
 611#endif
 612        mr.     r4,r26                  /* In some cases the loader may  */
 613#if defined(CONFIG_PPC_BOOK3E)
 614        tovirt(r4,r4)
 615#endif
 616        beq     9f                      /* have already put us at zero */
 617        li      r6,0x100                /* Start offset, the first 0x100 */
 618                                        /* bytes were copied earlier.    */
 619
 620#ifdef CONFIG_RELOCATABLE
 621/*
 622 * Check if the kernel has to be running as relocatable kernel based on the
 623 * variable __run_at_load, if it is set the kernel is treated as relocatable
 624 * kernel, otherwise it will be moved to PHYSICAL_START
 625 */
 626#if defined(CONFIG_PPC_BOOK3E)
 627        tovirt(r26,r26)         /* on booke, we already run at PAGE_OFFSET */
 628#endif
 629        lwz     r7,(FIXED_SYMBOL_ABS_ADDR(__run_at_load))(r26)
 630        cmplwi  cr0,r7,1
 631        bne     3f
 632
 633#ifdef CONFIG_PPC_BOOK3E
 634        LOAD_REG_ADDR(r5, __end_interrupts)
 635        LOAD_REG_ADDR(r11, _stext)
 636        sub     r5,r5,r11
 637#else
 638        /* just copy interrupts */
 639        LOAD_REG_IMMEDIATE_SYM(r5, r11, FIXED_SYMBOL_ABS_ADDR(__end_interrupts))
 640#endif
 641        b       5f
 6423:
 643#endif
 644        /* # bytes of memory to copy */
 645        lis     r5,(ABS_ADDR(copy_to_here))@ha
 646        addi    r5,r5,(ABS_ADDR(copy_to_here))@l
 647
 648        bl      copy_and_flush          /* copy the first n bytes        */
 649                                        /* this includes the code being  */
 650                                        /* executed here.                */
 651        /* Jump to the copy of this code that we just made */
 652        addis   r8,r3,(ABS_ADDR(4f))@ha
 653        addi    r12,r8,(ABS_ADDR(4f))@l
 654        mtctr   r12
 655        bctr
 656
 657.balign 8
 658p_end: .8byte _end - copy_to_here
 659
 6604:
 661        /*
 662         * Now copy the rest of the kernel up to _end, add
 663         * _end - copy_to_here to the copy limit and run again.
 664         */
 665        addis   r8,r26,(ABS_ADDR(p_end))@ha
 666        ld      r8,(ABS_ADDR(p_end))@l(r8)
 667        add     r5,r5,r8
 6685:      bl      copy_and_flush          /* copy the rest */
 669
 6709:      b       start_here_multiplatform
 671
 672/*
 673 * Copy routine used to copy the kernel to start at physical address 0
 674 * and flush and invalidate the caches as needed.
 675 * r3 = dest addr, r4 = source addr, r5 = copy limit, r6 = start offset
 676 * on exit, r3, r4, r5 are unchanged, r6 is updated to be >= r5.
 677 *
 678 * Note: this routine *only* clobbers r0, r6 and lr
 679 */
 680_GLOBAL(copy_and_flush)
 681        addi    r5,r5,-8
 682        addi    r6,r6,-8
 6834:      li      r0,8                    /* Use the smallest common      */
 684                                        /* denominator cache line       */
 685                                        /* size.  This results in       */
 686                                        /* extra cache line flushes     */
 687                                        /* but operation is correct.    */
 688                                        /* Can't get cache line size    */
 689                                        /* from NACA as it is being     */
 690                                        /* moved too.                   */
 691
 692        mtctr   r0                      /* put # words/line in ctr      */
 6933:      addi    r6,r6,8                 /* copy a cache line            */
 694        ldx     r0,r6,r4
 695        stdx    r0,r6,r3
 696        bdnz    3b
 697        dcbst   r6,r3                   /* write it to memory           */
 698        sync
 699        icbi    r6,r3                   /* flush the icache line        */
 700        cmpld   0,r6,r5
 701        blt     4b
 702        sync
 703        addi    r5,r5,8
 704        addi    r6,r6,8
 705        isync
 706        blr
 707
 708.align 8
 709copy_to_here:
 710
 711#ifdef CONFIG_SMP
 712#ifdef CONFIG_PPC_PMAC
 713/*
 714 * On PowerMac, secondary processors starts from the reset vector, which
 715 * is temporarily turned into a call to one of the functions below.
 716 */
 717        .section ".text";
 718        .align 2 ;
 719
 720        .globl  __secondary_start_pmac_0
 721__secondary_start_pmac_0:
 722        /* NB the entries for cpus 0, 1, 2 must each occupy 8 bytes. */
 723        li      r24,0
 724        b       1f
 725        li      r24,1
 726        b       1f
 727        li      r24,2
 728        b       1f
 729        li      r24,3
 7301:
 731        
 732_GLOBAL(pmac_secondary_start)
 733        /* turn on 64-bit mode */
 734        bl      enable_64b_mode
 735
 736        li      r0,0
 737        mfspr   r3,SPRN_HID4
 738        rldimi  r3,r0,40,23     /* clear bit 23 (rm_ci) */
 739        sync
 740        mtspr   SPRN_HID4,r3
 741        isync
 742        sync
 743        slbia
 744
 745        /* get TOC pointer (real address) */
 746        bl      relative_toc
 747        tovirt(r2,r2)
 748
 749        /* Copy some CPU settings from CPU 0 */
 750        bl      __restore_cpu_ppc970
 751
 752        /* pSeries do that early though I don't think we really need it */
 753        mfmsr   r3
 754        ori     r3,r3,MSR_RI
 755        mtmsrd  r3                      /* RI on */
 756
 757        /* Set up a paca value for this processor. */
 758        LOAD_REG_ADDR(r4,paca_ptrs)     /* Load paca pointer            */
 759        ld      r4,0(r4)                /* Get base vaddr of paca_ptrs array */
 760        sldi    r5,r24,3                /* get paca_ptrs[] index from cpu id */
 761        ldx     r13,r5,r4               /* r13 = paca_ptrs[cpu id]       */
 762        SET_PACA(r13)                   /* Save vaddr of paca in an SPRG*/
 763
 764        /* Mark interrupts soft and hard disabled (they might be enabled
 765         * in the PACA when doing hotplug)
 766         */
 767        li      r0,IRQS_DISABLED
 768        stb     r0,PACAIRQSOFTMASK(r13)
 769        li      r0,PACA_IRQ_HARD_DIS
 770        stb     r0,PACAIRQHAPPENED(r13)
 771
 772        /* Create a temp kernel stack for use before relocation is on.  */
 773        ld      r1,PACAEMERGSP(r13)
 774        subi    r1,r1,STACK_FRAME_OVERHEAD
 775
 776        b       __secondary_start
 777
 778#endif /* CONFIG_PPC_PMAC */
 779
 780/*
 781 * This function is called after the master CPU has released the
 782 * secondary processors.  The execution environment is relocation off.
 783 * The paca for this processor has the following fields initialized at
 784 * this point:
 785 *   1. Processor number
 786 *   2. Segment table pointer (virtual address)
 787 * On entry the following are set:
 788 *   r1        = stack pointer (real addr of temp stack)
 789 *   r24       = cpu# (in Linux terms)
 790 *   r13       = paca virtual address
 791 *   SPRG_PACA = paca virtual address
 792 */
 793        .section ".text";
 794        .align 2 ;
 795
 796        .globl  __secondary_start
 797__secondary_start:
 798        /* Set thread priority to MEDIUM */
 799        HMT_MEDIUM
 800
 801        /*
 802         * Do early setup for this CPU, in particular initialising the MMU so we
 803         * can turn it on below. This is a call to C, which is OK, we're still
 804         * running on the emergency stack.
 805         */
 806        bl      early_setup_secondary
 807
 808        /*
 809         * The primary has initialized our kernel stack for us in the paca, grab
 810         * it and put it in r1. We must *not* use it until we turn on the MMU
 811         * below, because it may not be inside the RMO.
 812         */
 813        ld      r1, PACAKSAVE(r13)
 814
 815        /* Clear backchain so we get nice backtraces */
 816        li      r7,0
 817        mtlr    r7
 818
 819        /* Mark interrupts soft and hard disabled (they might be enabled
 820         * in the PACA when doing hotplug)
 821         */
 822        li      r7,IRQS_DISABLED
 823        stb     r7,PACAIRQSOFTMASK(r13)
 824        li      r0,PACA_IRQ_HARD_DIS
 825        stb     r0,PACAIRQHAPPENED(r13)
 826
 827        /* enable MMU and jump to start_secondary */
 828        LOAD_REG_ADDR(r3, start_secondary_prolog)
 829        LOAD_REG_IMMEDIATE(r4, MSR_KERNEL)
 830
 831        mtspr   SPRN_SRR0,r3
 832        mtspr   SPRN_SRR1,r4
 833        RFI
 834        b       .       /* prevent speculative execution */
 835
 836/* 
 837 * Running with relocation on at this point.  All we want to do is
 838 * zero the stack back-chain pointer and get the TOC virtual address
 839 * before going into C code.
 840 */
 841start_secondary_prolog:
 842        ld      r2,PACATOC(r13)
 843        li      r3,0
 844        std     r3,0(r1)                /* Zero the stack frame pointer */
 845        bl      start_secondary
 846        b       .
 847/*
 848 * Reset stack pointer and call start_secondary
 849 * to continue with online operation when woken up
 850 * from cede in cpu offline.
 851 */
 852_GLOBAL(start_secondary_resume)
 853        ld      r1,PACAKSAVE(r13)       /* Reload kernel stack pointer */
 854        li      r3,0
 855        std     r3,0(r1)                /* Zero the stack frame pointer */
 856        bl      start_secondary
 857        b       .
 858#endif
 859
 860/*
 861 * This subroutine clobbers r11 and r12
 862 */
 863enable_64b_mode:
 864        mfmsr   r11                     /* grab the current MSR */
 865#ifdef CONFIG_PPC_BOOK3E
 866        oris    r11,r11,0x8000          /* CM bit set, we'll set ICM later */
 867        mtmsr   r11
 868#else /* CONFIG_PPC_BOOK3E */
 869        li      r12,(MSR_64BIT | MSR_ISF)@highest
 870        sldi    r12,r12,48
 871        or      r11,r11,r12
 872        mtmsrd  r11
 873        isync
 874#endif
 875        blr
 876
 877/*
 878 * This puts the TOC pointer into r2, offset by 0x8000 (as expected
 879 * by the toolchain).  It computes the correct value for wherever we
 880 * are running at the moment, using position-independent code.
 881 *
 882 * Note: The compiler constructs pointers using offsets from the
 883 * TOC in -mcmodel=medium mode. After we relocate to 0 but before
 884 * the MMU is on we need our TOC to be a virtual address otherwise
 885 * these pointers will be real addresses which may get stored and
 886 * accessed later with the MMU on. We use tovirt() at the call
 887 * sites to handle this.
 888 */
 889_GLOBAL(relative_toc)
 890        mflr    r0
 891        bcl     20,31,$+4
 8920:      mflr    r11
 893        ld      r2,(p_toc - 0b)(r11)
 894        add     r2,r2,r11
 895        mtlr    r0
 896        blr
 897
 898.balign 8
 899p_toc:  .8byte  __toc_start + 0x8000 - 0b
 900
 901/*
 902 * This is where the main kernel code starts.
 903 */
 904__REF
 905start_here_multiplatform:
 906        /* set up the TOC */
 907        bl      relative_toc
 908        tovirt(r2,r2)
 909
 910        /* Clear out the BSS. It may have been done in prom_init,
 911         * already but that's irrelevant since prom_init will soon
 912         * be detached from the kernel completely. Besides, we need
 913         * to clear it now for kexec-style entry.
 914         */
 915        LOAD_REG_ADDR(r11,__bss_stop)
 916        LOAD_REG_ADDR(r8,__bss_start)
 917        sub     r11,r11,r8              /* bss size                     */
 918        addi    r11,r11,7               /* round up to an even double word */
 919        srdi.   r11,r11,3               /* shift right by 3             */
 920        beq     4f
 921        addi    r8,r8,-8
 922        li      r0,0
 923        mtctr   r11                     /* zero this many doublewords   */
 9243:      stdu    r0,8(r8)
 925        bdnz    3b
 9264:
 927
 928#ifdef CONFIG_PPC_EARLY_DEBUG_OPAL
 929        /* Setup OPAL entry */
 930        LOAD_REG_ADDR(r11, opal)
 931        std     r28,0(r11);
 932        std     r29,8(r11);
 933#endif
 934
 935#ifndef CONFIG_PPC_BOOK3E
 936        mfmsr   r6
 937        ori     r6,r6,MSR_RI
 938        mtmsrd  r6                      /* RI on */
 939#endif
 940
 941#ifdef CONFIG_RELOCATABLE
 942        /* Save the physical address we're running at in kernstart_addr */
 943        LOAD_REG_ADDR(r4, kernstart_addr)
 944        clrldi  r0,r25,2
 945        std     r0,0(r4)
 946#endif
 947
 948        /* The following gets the stack set up with the regs */
 949        /* pointing to the real addr of the kernel stack.  This is   */
 950        /* all done to support the C function call below which sets  */
 951        /* up the htab.  This is done because we have relocated the  */
 952        /* kernel but are still running in real mode. */
 953
 954        LOAD_REG_ADDR(r3,init_thread_union)
 955
 956        /* set up a stack pointer */
 957        LOAD_REG_IMMEDIATE(r1,THREAD_SIZE)
 958        add     r1,r3,r1
 959        li      r0,0
 960        stdu    r0,-STACK_FRAME_OVERHEAD(r1)
 961
 962        /*
 963         * Do very early kernel initializations, including initial hash table
 964         * and SLB setup before we turn on relocation.
 965         */
 966
 967        /* Restore parameters passed from prom_init/kexec */
 968        mr      r3,r31
 969        LOAD_REG_ADDR(r12, DOTSYM(early_setup))
 970        mtctr   r12
 971        bctrl           /* also sets r13 and SPRG_PACA */
 972
 973        LOAD_REG_ADDR(r3, start_here_common)
 974        ld      r4,PACAKMSR(r13)
 975        mtspr   SPRN_SRR0,r3
 976        mtspr   SPRN_SRR1,r4
 977        RFI
 978        b       .       /* prevent speculative execution */
 979
 980        .previous
 981        /* This is where all platforms converge execution */
 982
 983start_here_common:
 984        /* relocation is on at this point */
 985        std     r1,PACAKSAVE(r13)
 986
 987        /* Load the TOC (virtual address) */
 988        ld      r2,PACATOC(r13)
 989
 990        /* Mark interrupts soft and hard disabled (they might be enabled
 991         * in the PACA when doing hotplug)
 992         */
 993        li      r0,IRQS_DISABLED
 994        stb     r0,PACAIRQSOFTMASK(r13)
 995        li      r0,PACA_IRQ_HARD_DIS
 996        stb     r0,PACAIRQHAPPENED(r13)
 997
 998        /* Generic kernel entry */
 999        bl      start_kernel
1000
1001        /* Not reached */
1002        trap
1003        EMIT_BUG_ENTRY 0b, __FILE__, __LINE__, 0
1004
1005/*
1006 * We put a few things here that have to be page-aligned.
1007 * This stuff goes at the beginning of the bss, which is page-aligned.
1008 */
1009        .section ".bss"
1010/*
1011 * pgd dir should be aligned to PGD_TABLE_SIZE which is 64K.
1012 * We will need to find a better way to fix this
1013 */
1014        .align  16
1015
1016        .globl  swapper_pg_dir
1017swapper_pg_dir:
1018        .space  PGD_TABLE_SIZE
1019
1020        .globl  empty_zero_page
1021empty_zero_page:
1022        .space  PAGE_SIZE
1023EXPORT_SYMBOL(empty_zero_page)
1024