qemu/target/s390x/mmu_helper.c
<<
>>
Prefs
   1/*
   2 * S390x MMU related functions
   3 *
   4 * Copyright (c) 2011 Alexander Graf
   5 * Copyright (c) 2015 Thomas Huth, IBM Corporation
   6 *
   7 * This program is free software; you can redistribute it and/or modify
   8 * it under the terms of the GNU General Public License as published by
   9 * the Free Software Foundation; either version 2 of the License, or
  10 * (at your option) any later version.
  11 *
  12 * This program is distributed in the hope that it will be useful,
  13 * but WITHOUT ANY WARRANTY; without even the implied warranty of
  14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
  15 * GNU General Public License for more details.
  16 */
  17
  18#include "qemu/osdep.h"
  19#include "qemu/error-report.h"
  20#include "exec/address-spaces.h"
  21#include "cpu.h"
  22#include "internal.h"
  23#include "kvm_s390x.h"
  24#include "sysemu/kvm.h"
  25#include "sysemu/tcg.h"
  26#include "exec/exec-all.h"
  27#include "trace.h"
  28#include "hw/s390x/storage-keys.h"
  29
  30/* #define DEBUG_S390 */
  31/* #define DEBUG_S390_PTE */
  32/* #define DEBUG_S390_STDOUT */
  33
  34#ifdef DEBUG_S390
  35#ifdef DEBUG_S390_STDOUT
  36#define DPRINTF(fmt, ...) \
  37    do { fprintf(stderr, fmt, ## __VA_ARGS__); \
  38         if (qemu_log_separate()) qemu_log(fmt, ##__VA_ARGS__); } while (0)
  39#else
  40#define DPRINTF(fmt, ...) \
  41    do { qemu_log(fmt, ## __VA_ARGS__); } while (0)
  42#endif
  43#else
  44#define DPRINTF(fmt, ...) \
  45    do { } while (0)
  46#endif
  47
  48#ifdef DEBUG_S390_PTE
  49#define PTE_DPRINTF DPRINTF
  50#else
  51#define PTE_DPRINTF(fmt, ...) \
  52    do { } while (0)
  53#endif
  54
  55/* Fetch/store bits in the translation exception code: */
  56#define FS_READ  0x800
  57#define FS_WRITE 0x400
  58
  59static void trigger_access_exception(CPUS390XState *env, uint32_t type,
  60                                     uint32_t ilen, uint64_t tec)
  61{
  62    S390CPU *cpu = env_archcpu(env);
  63
  64    if (kvm_enabled()) {
  65        kvm_s390_access_exception(cpu, type, tec);
  66    } else {
  67        CPUState *cs = env_cpu(env);
  68        if (type != PGM_ADDRESSING) {
  69            stq_phys(cs->as, env->psa + offsetof(LowCore, trans_exc_code), tec);
  70        }
  71        trigger_pgm_exception(env, type, ilen);
  72    }
  73}
  74
  75static void trigger_prot_fault(CPUS390XState *env, target_ulong vaddr,
  76                               uint64_t asc, int rw, bool exc)
  77{
  78    uint64_t tec;
  79
  80    tec = vaddr | (rw == MMU_DATA_STORE ? FS_WRITE : FS_READ) | 4 | asc >> 46;
  81
  82    DPRINTF("%s: trans_exc_code=%016" PRIx64 "\n", __func__, tec);
  83
  84    if (!exc) {
  85        return;
  86    }
  87
  88    trigger_access_exception(env, PGM_PROTECTION, ILEN_AUTO, tec);
  89}
  90
  91static void trigger_page_fault(CPUS390XState *env, target_ulong vaddr,
  92                               uint32_t type, uint64_t asc, int rw, bool exc)
  93{
  94    int ilen = ILEN_AUTO;
  95    uint64_t tec;
  96
  97    tec = vaddr | (rw == MMU_DATA_STORE ? FS_WRITE : FS_READ) | asc >> 46;
  98
  99    DPRINTF("%s: trans_exc_code=%016" PRIx64 "\n", __func__, tec);
 100
 101    if (!exc) {
 102        return;
 103    }
 104
 105    /* Code accesses have an undefined ilc.  */
 106    if (rw == MMU_INST_FETCH) {
 107        ilen = 2;
 108    }
 109
 110    trigger_access_exception(env, type, ilen, tec);
 111}
 112
 113/* check whether the address would be proteted by Low-Address Protection */
 114static bool is_low_address(uint64_t addr)
 115{
 116    return addr <= 511 || (addr >= 4096 && addr <= 4607);
 117}
 118
 119/* check whether Low-Address Protection is enabled for mmu_translate() */
 120static bool lowprot_enabled(const CPUS390XState *env, uint64_t asc)
 121{
 122    if (!(env->cregs[0] & CR0_LOWPROT)) {
 123        return false;
 124    }
 125    if (!(env->psw.mask & PSW_MASK_DAT)) {
 126        return true;
 127    }
 128
 129    /* Check the private-space control bit */
 130    switch (asc) {
 131    case PSW_ASC_PRIMARY:
 132        return !(env->cregs[1] & ASCE_PRIVATE_SPACE);
 133    case PSW_ASC_SECONDARY:
 134        return !(env->cregs[7] & ASCE_PRIVATE_SPACE);
 135    case PSW_ASC_HOME:
 136        return !(env->cregs[13] & ASCE_PRIVATE_SPACE);
 137    default:
 138        /* We don't support access register mode */
 139        error_report("unsupported addressing mode");
 140        exit(1);
 141    }
 142}
 143
 144/**
 145 * Translate real address to absolute (= physical)
 146 * address by taking care of the prefix mapping.
 147 */
 148target_ulong mmu_real2abs(CPUS390XState *env, target_ulong raddr)
 149{
 150    if (raddr < 0x2000) {
 151        return raddr + env->psa;    /* Map the lowcore. */
 152    } else if (raddr >= env->psa && raddr < env->psa + 0x2000) {
 153        return raddr - env->psa;    /* Map the 0 page. */
 154    }
 155    return raddr;
 156}
 157
 158/* Decode page table entry (normal 4KB page) */
 159static int mmu_translate_pte(CPUS390XState *env, target_ulong vaddr,
 160                             uint64_t asc, uint64_t pt_entry,
 161                             target_ulong *raddr, int *flags, int rw, bool exc)
 162{
 163    if (pt_entry & PAGE_INVALID) {
 164        DPRINTF("%s: PTE=0x%" PRIx64 " invalid\n", __func__, pt_entry);
 165        trigger_page_fault(env, vaddr, PGM_PAGE_TRANS, asc, rw, exc);
 166        return -1;
 167    }
 168    if (pt_entry & PAGE_RES0) {
 169        trigger_page_fault(env, vaddr, PGM_TRANS_SPEC, asc, rw, exc);
 170        return -1;
 171    }
 172    if (pt_entry & PAGE_RO) {
 173        *flags &= ~PAGE_WRITE;
 174    }
 175
 176    *raddr = pt_entry & ASCE_ORIGIN;
 177
 178    PTE_DPRINTF("%s: PTE=0x%" PRIx64 "\n", __func__, pt_entry);
 179
 180    return 0;
 181}
 182
 183/* Decode segment table entry */
 184static int mmu_translate_segment(CPUS390XState *env, target_ulong vaddr,
 185                                 uint64_t asc, uint64_t st_entry,
 186                                 target_ulong *raddr, int *flags, int rw,
 187                                 bool exc)
 188{
 189    CPUState *cs = env_cpu(env);
 190    uint64_t origin, offs, pt_entry;
 191
 192    if (st_entry & SEGMENT_ENTRY_RO) {
 193        *flags &= ~PAGE_WRITE;
 194    }
 195
 196    if ((st_entry & SEGMENT_ENTRY_FC) && (env->cregs[0] & CR0_EDAT)) {
 197        /* Decode EDAT1 segment frame absolute address (1MB page) */
 198        *raddr = (st_entry & 0xfffffffffff00000ULL) | (vaddr & 0xfffff);
 199        PTE_DPRINTF("%s: SEG=0x%" PRIx64 "\n", __func__, st_entry);
 200        return 0;
 201    }
 202
 203    /* Look up 4KB page entry */
 204    origin = st_entry & SEGMENT_ENTRY_ORIGIN;
 205    offs  = (vaddr & VADDR_PX) >> 9;
 206    pt_entry = ldq_phys(cs->as, origin + offs);
 207    PTE_DPRINTF("%s: 0x%" PRIx64 " + 0x%" PRIx64 " => 0x%016" PRIx64 "\n",
 208                __func__, origin, offs, pt_entry);
 209    return mmu_translate_pte(env, vaddr, asc, pt_entry, raddr, flags, rw, exc);
 210}
 211
 212/* Decode region table entries */
 213static int mmu_translate_region(CPUS390XState *env, target_ulong vaddr,
 214                                uint64_t asc, uint64_t entry, int level,
 215                                target_ulong *raddr, int *flags, int rw,
 216                                bool exc)
 217{
 218    CPUState *cs = env_cpu(env);
 219    uint64_t origin, offs, new_entry;
 220    const int pchks[4] = {
 221        PGM_SEGMENT_TRANS, PGM_REG_THIRD_TRANS,
 222        PGM_REG_SEC_TRANS, PGM_REG_FIRST_TRANS
 223    };
 224
 225    PTE_DPRINTF("%s: 0x%" PRIx64 "\n", __func__, entry);
 226
 227    origin = entry & REGION_ENTRY_ORIGIN;
 228    offs = (vaddr >> (17 + 11 * level / 4)) & 0x3ff8;
 229
 230    new_entry = ldq_phys(cs->as, origin + offs);
 231    PTE_DPRINTF("%s: 0x%" PRIx64 " + 0x%" PRIx64 " => 0x%016" PRIx64 "\n",
 232                __func__, origin, offs, new_entry);
 233
 234    if ((new_entry & REGION_ENTRY_INV) != 0) {
 235        DPRINTF("%s: invalid region\n", __func__);
 236        trigger_page_fault(env, vaddr, pchks[level / 4], asc, rw, exc);
 237        return -1;
 238    }
 239
 240    if ((new_entry & REGION_ENTRY_TYPE_MASK) != level) {
 241        trigger_page_fault(env, vaddr, PGM_TRANS_SPEC, asc, rw, exc);
 242        return -1;
 243    }
 244
 245    if (level == ASCE_TYPE_SEGMENT) {
 246        return mmu_translate_segment(env, vaddr, asc, new_entry, raddr, flags,
 247                                     rw, exc);
 248    }
 249
 250    /* Check region table offset and length */
 251    offs = (vaddr >> (28 + 11 * (level - 4) / 4)) & 3;
 252    if (offs < ((new_entry & REGION_ENTRY_TF) >> 6)
 253        || offs > (new_entry & REGION_ENTRY_LENGTH)) {
 254        DPRINTF("%s: invalid offset or len (%lx)\n", __func__, new_entry);
 255        trigger_page_fault(env, vaddr, pchks[level / 4 - 1], asc, rw, exc);
 256        return -1;
 257    }
 258
 259    if ((env->cregs[0] & CR0_EDAT) && (new_entry & REGION_ENTRY_RO)) {
 260        *flags &= ~PAGE_WRITE;
 261    }
 262
 263    /* yet another region */
 264    return mmu_translate_region(env, vaddr, asc, new_entry, level - 4,
 265                                raddr, flags, rw, exc);
 266}
 267
 268static int mmu_translate_asce(CPUS390XState *env, target_ulong vaddr,
 269                              uint64_t asc, uint64_t asce, target_ulong *raddr,
 270                              int *flags, int rw, bool exc)
 271{
 272    int level;
 273    int r;
 274
 275    if (asce & ASCE_REAL_SPACE) {
 276        /* direct mapping */
 277        *raddr = vaddr;
 278        return 0;
 279    }
 280
 281    level = asce & ASCE_TYPE_MASK;
 282    switch (level) {
 283    case ASCE_TYPE_REGION1:
 284        if ((vaddr >> 62) > (asce & ASCE_TABLE_LENGTH)) {
 285            trigger_page_fault(env, vaddr, PGM_REG_FIRST_TRANS, asc, rw, exc);
 286            return -1;
 287        }
 288        break;
 289    case ASCE_TYPE_REGION2:
 290        if (vaddr & 0xffe0000000000000ULL) {
 291            DPRINTF("%s: vaddr doesn't fit 0x%16" PRIx64
 292                    " 0xffe0000000000000ULL\n", __func__, vaddr);
 293            trigger_page_fault(env, vaddr, PGM_ASCE_TYPE, asc, rw, exc);
 294            return -1;
 295        }
 296        if ((vaddr >> 51 & 3) > (asce & ASCE_TABLE_LENGTH)) {
 297            trigger_page_fault(env, vaddr, PGM_REG_SEC_TRANS, asc, rw, exc);
 298            return -1;
 299        }
 300        break;
 301    case ASCE_TYPE_REGION3:
 302        if (vaddr & 0xfffffc0000000000ULL) {
 303            DPRINTF("%s: vaddr doesn't fit 0x%16" PRIx64
 304                    " 0xfffffc0000000000ULL\n", __func__, vaddr);
 305            trigger_page_fault(env, vaddr, PGM_ASCE_TYPE, asc, rw, exc);
 306            return -1;
 307        }
 308        if ((vaddr >> 40 & 3) > (asce & ASCE_TABLE_LENGTH)) {
 309            trigger_page_fault(env, vaddr, PGM_REG_THIRD_TRANS, asc, rw, exc);
 310            return -1;
 311        }
 312        break;
 313    case ASCE_TYPE_SEGMENT:
 314        if (vaddr & 0xffffffff80000000ULL) {
 315            DPRINTF("%s: vaddr doesn't fit 0x%16" PRIx64
 316                    " 0xffffffff80000000ULL\n", __func__, vaddr);
 317            trigger_page_fault(env, vaddr, PGM_ASCE_TYPE, asc, rw, exc);
 318            return -1;
 319        }
 320        if ((vaddr >> 29 & 3) > (asce & ASCE_TABLE_LENGTH)) {
 321            trigger_page_fault(env, vaddr, PGM_SEGMENT_TRANS, asc, rw, exc);
 322            return -1;
 323        }
 324        break;
 325    }
 326
 327    r = mmu_translate_region(env, vaddr, asc, asce, level, raddr, flags, rw,
 328                             exc);
 329    if (!r && rw == MMU_DATA_STORE && !(*flags & PAGE_WRITE)) {
 330        trigger_prot_fault(env, vaddr, asc, rw, exc);
 331        return -1;
 332    }
 333
 334    return r;
 335}
 336
 337/**
 338 * Translate a virtual (logical) address into a physical (absolute) address.
 339 * @param vaddr  the virtual address
 340 * @param rw     0 = read, 1 = write, 2 = code fetch
 341 * @param asc    address space control (one of the PSW_ASC_* modes)
 342 * @param raddr  the translated address is stored to this pointer
 343 * @param flags  the PAGE_READ/WRITE/EXEC flags are stored to this pointer
 344 * @param exc    true = inject a program check if a fault occurred
 345 * @return       0 if the translation was successful, -1 if a fault occurred
 346 */
 347int mmu_translate(CPUS390XState *env, target_ulong vaddr, int rw, uint64_t asc,
 348                  target_ulong *raddr, int *flags, bool exc)
 349{
 350    static S390SKeysState *ss;
 351    static S390SKeysClass *skeyclass;
 352    int r = -1;
 353    uint8_t key;
 354
 355    if (unlikely(!ss)) {
 356        ss = s390_get_skeys_device();
 357        skeyclass = S390_SKEYS_GET_CLASS(ss);
 358    }
 359
 360    *flags = PAGE_READ | PAGE_WRITE | PAGE_EXEC;
 361    if (is_low_address(vaddr & TARGET_PAGE_MASK) && lowprot_enabled(env, asc)) {
 362        /*
 363         * If any part of this page is currently protected, make sure the
 364         * TLB entry will not be reused.
 365         *
 366         * As the protected range is always the first 512 bytes of the
 367         * two first pages, we are able to catch all writes to these areas
 368         * just by looking at the start address (triggering the tlb miss).
 369         */
 370        *flags |= PAGE_WRITE_INV;
 371        if (is_low_address(vaddr) && rw == MMU_DATA_STORE) {
 372            if (exc) {
 373                trigger_access_exception(env, PGM_PROTECTION, ILEN_AUTO, 0);
 374            }
 375            return -EACCES;
 376        }
 377    }
 378
 379    vaddr &= TARGET_PAGE_MASK;
 380
 381    if (!(env->psw.mask & PSW_MASK_DAT)) {
 382        *raddr = vaddr;
 383        r = 0;
 384        goto out;
 385    }
 386
 387    switch (asc) {
 388    case PSW_ASC_PRIMARY:
 389        PTE_DPRINTF("%s: asc=primary\n", __func__);
 390        r = mmu_translate_asce(env, vaddr, asc, env->cregs[1], raddr, flags,
 391                               rw, exc);
 392        break;
 393    case PSW_ASC_HOME:
 394        PTE_DPRINTF("%s: asc=home\n", __func__);
 395        r = mmu_translate_asce(env, vaddr, asc, env->cregs[13], raddr, flags,
 396                               rw, exc);
 397        break;
 398    case PSW_ASC_SECONDARY:
 399        PTE_DPRINTF("%s: asc=secondary\n", __func__);
 400        /*
 401         * Instruction: Primary
 402         * Data: Secondary
 403         */
 404        if (rw == MMU_INST_FETCH) {
 405            r = mmu_translate_asce(env, vaddr, PSW_ASC_PRIMARY, env->cregs[1],
 406                                   raddr, flags, rw, exc);
 407            *flags &= ~(PAGE_READ | PAGE_WRITE);
 408        } else {
 409            r = mmu_translate_asce(env, vaddr, PSW_ASC_SECONDARY, env->cregs[7],
 410                                   raddr, flags, rw, exc);
 411            *flags &= ~(PAGE_EXEC);
 412        }
 413        break;
 414    case PSW_ASC_ACCREG:
 415    default:
 416        hw_error("guest switched to unknown asc mode\n");
 417        break;
 418    }
 419
 420 out:
 421    /* Convert real address -> absolute address */
 422    *raddr = mmu_real2abs(env, *raddr);
 423
 424    if (r == 0 && *raddr < ram_size) {
 425        if (skeyclass->get_skeys(ss, *raddr / TARGET_PAGE_SIZE, 1, &key)) {
 426            trace_get_skeys_nonzero(r);
 427            return 0;
 428        }
 429
 430        if (*flags & PAGE_READ) {
 431            key |= SK_R;
 432        }
 433
 434        if (*flags & PAGE_WRITE) {
 435            key |= SK_C;
 436        }
 437
 438        if (skeyclass->set_skeys(ss, *raddr / TARGET_PAGE_SIZE, 1, &key)) {
 439            trace_set_skeys_nonzero(r);
 440            return 0;
 441        }
 442    }
 443
 444    return r;
 445}
 446
 447/**
 448 * translate_pages: Translate a set of consecutive logical page addresses
 449 * to absolute addresses. This function is used for TCG and old KVM without
 450 * the MEMOP interface.
 451 */
 452static int translate_pages(S390CPU *cpu, vaddr addr, int nr_pages,
 453                           target_ulong *pages, bool is_write)
 454{
 455    uint64_t asc = cpu->env.psw.mask & PSW_MASK_ASC;
 456    CPUS390XState *env = &cpu->env;
 457    int ret, i, pflags;
 458
 459    for (i = 0; i < nr_pages; i++) {
 460        ret = mmu_translate(env, addr, is_write, asc, &pages[i], &pflags, true);
 461        if (ret) {
 462            return ret;
 463        }
 464        if (!address_space_access_valid(&address_space_memory, pages[i],
 465                                        TARGET_PAGE_SIZE, is_write,
 466                                        MEMTXATTRS_UNSPECIFIED)) {
 467            trigger_access_exception(env, PGM_ADDRESSING, ILEN_AUTO, 0);
 468            return -EFAULT;
 469        }
 470        addr += TARGET_PAGE_SIZE;
 471    }
 472
 473    return 0;
 474}
 475
 476/**
 477 * s390_cpu_virt_mem_rw:
 478 * @laddr:     the logical start address
 479 * @ar:        the access register number
 480 * @hostbuf:   buffer in host memory. NULL = do only checks w/o copying
 481 * @len:       length that should be transferred
 482 * @is_write:  true = write, false = read
 483 * Returns:    0 on success, non-zero if an exception occurred
 484 *
 485 * Copy from/to guest memory using logical addresses. Note that we inject a
 486 * program interrupt in case there is an error while accessing the memory.
 487 *
 488 * This function will always return (also for TCG), make sure to call
 489 * s390_cpu_virt_mem_handle_exc() to properly exit the CPU loop.
 490 */
 491int s390_cpu_virt_mem_rw(S390CPU *cpu, vaddr laddr, uint8_t ar, void *hostbuf,
 492                         int len, bool is_write)
 493{
 494    int currlen, nr_pages, i;
 495    target_ulong *pages;
 496    int ret;
 497
 498    if (kvm_enabled()) {
 499        ret = kvm_s390_mem_op(cpu, laddr, ar, hostbuf, len, is_write);
 500        if (ret >= 0) {
 501            return ret;
 502        }
 503    }
 504
 505    nr_pages = (((laddr & ~TARGET_PAGE_MASK) + len - 1) >> TARGET_PAGE_BITS)
 506               + 1;
 507    pages = g_malloc(nr_pages * sizeof(*pages));
 508
 509    ret = translate_pages(cpu, laddr, nr_pages, pages, is_write);
 510    if (ret == 0 && hostbuf != NULL) {
 511        /* Copy data by stepping through the area page by page */
 512        for (i = 0; i < nr_pages; i++) {
 513            currlen = MIN(len, TARGET_PAGE_SIZE - (laddr % TARGET_PAGE_SIZE));
 514            cpu_physical_memory_rw(pages[i] | (laddr & ~TARGET_PAGE_MASK),
 515                                   hostbuf, currlen, is_write);
 516            laddr += currlen;
 517            hostbuf += currlen;
 518            len -= currlen;
 519        }
 520    }
 521
 522    g_free(pages);
 523    return ret;
 524}
 525
 526void s390_cpu_virt_mem_handle_exc(S390CPU *cpu, uintptr_t ra)
 527{
 528    /* KVM will handle the interrupt automatically, TCG has to exit the TB */
 529#ifdef CONFIG_TCG
 530    if (tcg_enabled()) {
 531        cpu_loop_exit_restore(CPU(cpu), ra);
 532    }
 533#endif
 534}
 535
 536/**
 537 * Translate a real address into a physical (absolute) address.
 538 * @param raddr  the real address
 539 * @param rw     0 = read, 1 = write, 2 = code fetch
 540 * @param addr   the translated address is stored to this pointer
 541 * @param flags  the PAGE_READ/WRITE/EXEC flags are stored to this pointer
 542 * @return       0 if the translation was successful, < 0 if a fault occurred
 543 */
 544int mmu_translate_real(CPUS390XState *env, target_ulong raddr, int rw,
 545                       target_ulong *addr, int *flags)
 546{
 547    const bool lowprot_enabled = env->cregs[0] & CR0_LOWPROT;
 548
 549    *flags = PAGE_READ | PAGE_WRITE | PAGE_EXEC;
 550    if (is_low_address(raddr & TARGET_PAGE_MASK) && lowprot_enabled) {
 551        /* see comment in mmu_translate() how this works */
 552        *flags |= PAGE_WRITE_INV;
 553        if (is_low_address(raddr) && rw == MMU_DATA_STORE) {
 554            trigger_access_exception(env, PGM_PROTECTION, ILEN_AUTO, 0);
 555            return -EACCES;
 556        }
 557    }
 558
 559    *addr = mmu_real2abs(env, raddr & TARGET_PAGE_MASK);
 560
 561    /* TODO: storage key handling */
 562    return 0;
 563}
 564