linux/drivers/gpu/drm/nouveau/nvkm/subdev/fb/ramnv50.c
<<
>>
Prefs
   1/*
   2 * Copyright 2013 Red Hat Inc.
   3 *
   4 * Permission is hereby granted, free of charge, to any person obtaining a
   5 * copy of this software and associated documentation files (the "Software"),
   6 * to deal in the Software without restriction, including without limitation
   7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
   8 * and/or sell copies of the Software, and to permit persons to whom the
   9 * Software is furnished to do so, subject to the following conditions:
  10 *
  11 * The above copyright notice and this permission notice shall be included in
  12 * all copies or substantial portions of the Software.
  13 *
  14 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
  15 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
  16 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
  17 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
  18 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
  19 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
  20 * OTHER DEALINGS IN THE SOFTWARE.
  21 *
  22 * Authors: Ben Skeggs
  23 */
  24#define nv50_ram(p) container_of((p), struct nv50_ram, base)
  25#include "ram.h"
  26#include "ramseq.h"
  27#include "nv50.h"
  28
  29#include <core/option.h>
  30#include <subdev/bios.h>
  31#include <subdev/bios/perf.h>
  32#include <subdev/bios/pll.h>
  33#include <subdev/bios/rammap.h>
  34#include <subdev/bios/timing.h>
  35#include <subdev/clk/pll.h>
  36#include <subdev/gpio.h>
  37
  38struct nv50_ramseq {
  39        struct hwsq base;
  40        struct hwsq_reg r_0x002504;
  41        struct hwsq_reg r_0x004008;
  42        struct hwsq_reg r_0x00400c;
  43        struct hwsq_reg r_0x00c040;
  44        struct hwsq_reg r_0x100200;
  45        struct hwsq_reg r_0x100210;
  46        struct hwsq_reg r_0x10021c;
  47        struct hwsq_reg r_0x1002d0;
  48        struct hwsq_reg r_0x1002d4;
  49        struct hwsq_reg r_0x1002dc;
  50        struct hwsq_reg r_0x10053c;
  51        struct hwsq_reg r_0x1005a0;
  52        struct hwsq_reg r_0x1005a4;
  53        struct hwsq_reg r_0x100710;
  54        struct hwsq_reg r_0x100714;
  55        struct hwsq_reg r_0x100718;
  56        struct hwsq_reg r_0x10071c;
  57        struct hwsq_reg r_0x100da0;
  58        struct hwsq_reg r_0x100e20;
  59        struct hwsq_reg r_0x100e24;
  60        struct hwsq_reg r_0x611200;
  61        struct hwsq_reg r_timing[9];
  62        struct hwsq_reg r_mr[4];
  63        struct hwsq_reg r_gpio[4];
  64};
  65
  66struct nv50_ram {
  67        struct nvkm_ram base;
  68        struct nv50_ramseq hwsq;
  69};
  70
  71#define T(t) cfg->timing_10_##t
  72static int
  73nv50_ram_timing_calc(struct nv50_ram *ram, u32 *timing)
  74{
  75        struct nvbios_ramcfg *cfg = &ram->base.target.bios;
  76        struct nvkm_subdev *subdev = &ram->base.fb->subdev;
  77        struct nvkm_device *device = subdev->device;
  78        u32 cur2, cur4, cur7, cur8;
  79        u8 unkt3b;
  80
  81        cur2 = nvkm_rd32(device, 0x100228);
  82        cur4 = nvkm_rd32(device, 0x100230);
  83        cur7 = nvkm_rd32(device, 0x10023c);
  84        cur8 = nvkm_rd32(device, 0x100240);
  85
  86        switch ((!T(CWL)) * ram->base.type) {
  87        case NVKM_RAM_TYPE_DDR2:
  88                T(CWL) = T(CL) - 1;
  89                break;
  90        case NVKM_RAM_TYPE_GDDR3:
  91                T(CWL) = ((cur2 & 0xff000000) >> 24) + 1;
  92                break;
  93        }
  94
  95        /* XXX: N=1 is not proper statistics */
  96        if (device->chipset == 0xa0) {
  97                unkt3b = 0x19 + ram->base.next->bios.rammap_00_16_40;
  98                timing[6] = (0x2d + T(CL) - T(CWL) +
  99                                ram->base.next->bios.rammap_00_16_40) << 16 |
 100                            T(CWL) << 8 |
 101                            (0x2f + T(CL) - T(CWL));
 102        } else {
 103                unkt3b = 0x16;
 104                timing[6] = (0x2b + T(CL) - T(CWL)) << 16 |
 105                            max_t(s8, T(CWL) - 2, 1) << 8 |
 106                            (0x2e + T(CL) - T(CWL));
 107        }
 108
 109        timing[0] = (T(RP) << 24 | T(RAS) << 16 | T(RFC) << 8 | T(RC));
 110        timing[1] = (T(WR) + 1 + T(CWL)) << 24 |
 111                    max_t(u8, T(18), 1) << 16 |
 112                    (T(WTR) + 1 + T(CWL)) << 8 |
 113                    (3 + T(CL) - T(CWL));
 114        timing[2] = (T(CWL) - 1) << 24 |
 115                    (T(RRD) << 16) |
 116                    (T(RCDWR) << 8) |
 117                    T(RCDRD);
 118        timing[3] = (unkt3b - 2 + T(CL)) << 24 |
 119                    unkt3b << 16 |
 120                    (T(CL) - 1) << 8 |
 121                    (T(CL) - 1);
 122        timing[4] = (cur4 & 0xffff0000) |
 123                    T(13) << 8 |
 124                    T(13);
 125        timing[5] = T(RFC) << 24 |
 126                    max_t(u8, T(RCDRD), T(RCDWR)) << 16 |
 127                    T(RP);
 128        /* Timing 6 is already done above */
 129        timing[7] = (cur7 & 0xff00ffff) | (T(CL) - 1) << 16;
 130        timing[8] = (cur8 & 0xffffff00);
 131
 132        /* XXX: P.version == 1 only has DDR2 and GDDR3? */
 133        if (ram->base.type == NVKM_RAM_TYPE_DDR2) {
 134                timing[5] |= (T(CL) + 3) << 8;
 135                timing[8] |= (T(CL) - 4);
 136        } else
 137        if (ram->base.type == NVKM_RAM_TYPE_GDDR3) {
 138                timing[5] |= (T(CL) + 2) << 8;
 139                timing[8] |= (T(CL) - 2);
 140        }
 141
 142        nvkm_debug(subdev, " 220: %08x %08x %08x %08x\n",
 143                   timing[0], timing[1], timing[2], timing[3]);
 144        nvkm_debug(subdev, " 230: %08x %08x %08x %08x\n",
 145                   timing[4], timing[5], timing[6], timing[7]);
 146        nvkm_debug(subdev, " 240: %08x\n", timing[8]);
 147        return 0;
 148}
 149
 150static int
 151nv50_ram_timing_read(struct nv50_ram *ram, u32 *timing)
 152{
 153        unsigned int i;
 154        struct nvbios_ramcfg *cfg = &ram->base.target.bios;
 155        struct nvkm_subdev *subdev = &ram->base.fb->subdev;
 156        struct nvkm_device *device = subdev->device;
 157
 158        for (i = 0; i <= 8; i++)
 159                timing[i] = nvkm_rd32(device, 0x100220 + (i * 4));
 160
 161        /* Derive the bare minimum for the MR calculation to succeed */
 162        cfg->timing_ver = 0x10;
 163        T(CL) = (timing[3] & 0xff) + 1;
 164
 165        switch (ram->base.type) {
 166        case NVKM_RAM_TYPE_DDR2:
 167                T(CWL) = T(CL) - 1;
 168                break;
 169        case NVKM_RAM_TYPE_GDDR3:
 170                T(CWL) = ((timing[2] & 0xff000000) >> 24) + 1;
 171                break;
 172        default:
 173                return -ENOSYS;
 174                break;
 175        }
 176
 177        T(WR) = ((timing[1] >> 24) & 0xff) - 1 - T(CWL);
 178
 179        return 0;
 180}
 181#undef T
 182
 183static void
 184nvkm_sddr2_dll_reset(struct nv50_ramseq *hwsq)
 185{
 186        ram_mask(hwsq, mr[0], 0x100, 0x100);
 187        ram_mask(hwsq, mr[0], 0x100, 0x000);
 188        ram_nsec(hwsq, 24000);
 189}
 190
 191static void
 192nv50_ram_gpio(struct nv50_ramseq *hwsq, u8 tag, u32 val)
 193{
 194        struct nvkm_gpio *gpio = hwsq->base.subdev->device->gpio;
 195        struct dcb_gpio_func func;
 196        u32 reg, sh, gpio_val;
 197        int ret;
 198
 199        if (nvkm_gpio_get(gpio, 0, tag, DCB_GPIO_UNUSED) != val) {
 200                ret = nvkm_gpio_find(gpio, 0, tag, DCB_GPIO_UNUSED, &func);
 201                if (ret)
 202                        return;
 203
 204                reg = func.line >> 3;
 205                sh = (func.line & 0x7) << 2;
 206                gpio_val = ram_rd32(hwsq, gpio[reg]);
 207
 208                if (gpio_val & (8 << sh))
 209                        val = !val;
 210                if (!(func.log[1] & 1))
 211                        val = !val;
 212
 213                ram_mask(hwsq, gpio[reg], (0x3 << sh), ((val | 0x2) << sh));
 214                ram_nsec(hwsq, 20000);
 215        }
 216}
 217
 218static int
 219nv50_ram_calc(struct nvkm_ram *base, u32 freq)
 220{
 221        struct nv50_ram *ram = nv50_ram(base);
 222        struct nv50_ramseq *hwsq = &ram->hwsq;
 223        struct nvkm_subdev *subdev = &ram->base.fb->subdev;
 224        struct nvkm_bios *bios = subdev->device->bios;
 225        struct nvbios_perfE perfE;
 226        struct nvbios_pll mpll;
 227        struct nvkm_ram_data *next;
 228        u8  ver, hdr, cnt, len, strap, size;
 229        u32 data;
 230        u32 r100da0, r004008, unk710, unk714, unk718, unk71c;
 231        int N1, M1, N2, M2, P;
 232        int ret, i;
 233        u32 timing[9];
 234
 235        next = &ram->base.target;
 236        next->freq = freq;
 237        ram->base.next = next;
 238
 239        /* lookup closest matching performance table entry for frequency */
 240        i = 0;
 241        do {
 242                data = nvbios_perfEp(bios, i++, &ver, &hdr, &cnt,
 243                                     &size, &perfE);
 244                if (!data || (ver < 0x25 || ver >= 0x40) ||
 245                    (size < 2)) {
 246                        nvkm_error(subdev, "invalid/missing perftab entry\n");
 247                        return -EINVAL;
 248                }
 249        } while (perfE.memory < freq);
 250
 251        nvbios_rammapEp_from_perf(bios, data, hdr, &next->bios);
 252
 253        /* locate specific data set for the attached memory */
 254        strap = nvbios_ramcfg_index(subdev);
 255        if (strap >= cnt) {
 256                nvkm_error(subdev, "invalid ramcfg strap\n");
 257                return -EINVAL;
 258        }
 259
 260        data = nvbios_rammapSp_from_perf(bios, data + hdr, size, strap,
 261                        &next->bios);
 262        if (!data) {
 263                nvkm_error(subdev, "invalid/missing rammap entry ");
 264                return -EINVAL;
 265        }
 266
 267        /* lookup memory timings, if bios says they're present */
 268        if (next->bios.ramcfg_timing != 0xff) {
 269                data = nvbios_timingEp(bios, next->bios.ramcfg_timing,
 270                                        &ver, &hdr, &cnt, &len, &next->bios);
 271                if (!data || ver != 0x10 || hdr < 0x12) {
 272                        nvkm_error(subdev, "invalid/missing timing entry "
 273                                 "%02x %04x %02x %02x\n",
 274                                 strap, data, ver, hdr);
 275                        return -EINVAL;
 276                }
 277                nv50_ram_timing_calc(ram, timing);
 278        } else {
 279                nv50_ram_timing_read(ram, timing);
 280        }
 281
 282        ret = ram_init(hwsq, subdev);
 283        if (ret)
 284                return ret;
 285
 286        /* Determine ram-specific MR values */
 287        ram->base.mr[0] = ram_rd32(hwsq, mr[0]);
 288        ram->base.mr[1] = ram_rd32(hwsq, mr[1]);
 289        ram->base.mr[2] = ram_rd32(hwsq, mr[2]);
 290
 291        switch (ram->base.type) {
 292        case NVKM_RAM_TYPE_GDDR3:
 293                ret = nvkm_gddr3_calc(&ram->base);
 294                break;
 295        default:
 296                ret = -ENOSYS;
 297                break;
 298        }
 299
 300        if (ret) {
 301                nvkm_error(subdev, "Could not calculate MR\n");
 302                return ret;
 303        }
 304
 305        if (subdev->device->chipset <= 0x96 && !next->bios.ramcfg_00_03_02)
 306                ram_mask(hwsq, 0x100710, 0x00000200, 0x00000000);
 307
 308        /* Always disable this bit during reclock */
 309        ram_mask(hwsq, 0x100200, 0x00000800, 0x00000000);
 310
 311        ram_wait_vblank(hwsq);
 312        ram_wr32(hwsq, 0x611200, 0x00003300);
 313        ram_wr32(hwsq, 0x002504, 0x00000001); /* block fifo */
 314        ram_nsec(hwsq, 8000);
 315        ram_setf(hwsq, 0x10, 0x00); /* disable fb */
 316        ram_wait(hwsq, 0x00, 0x01); /* wait for fb disabled */
 317        ram_nsec(hwsq, 2000);
 318
 319        if (next->bios.timing_10_ODT)
 320                nv50_ram_gpio(hwsq, 0x2e, 1);
 321
 322        ram_wr32(hwsq, 0x1002d4, 0x00000001); /* precharge */
 323        ram_wr32(hwsq, 0x1002d0, 0x00000001); /* refresh */
 324        ram_wr32(hwsq, 0x1002d0, 0x00000001); /* refresh */
 325        ram_wr32(hwsq, 0x100210, 0x00000000); /* disable auto-refresh */
 326        ram_wr32(hwsq, 0x1002dc, 0x00000001); /* enable self-refresh */
 327
 328        ret = nvbios_pll_parse(bios, 0x004008, &mpll);
 329        mpll.vco2.max_freq = 0;
 330        if (ret >= 0) {
 331                ret = nv04_pll_calc(subdev, &mpll, freq,
 332                                    &N1, &M1, &N2, &M2, &P);
 333                if (ret <= 0)
 334                        ret = -EINVAL;
 335        }
 336
 337        if (ret < 0)
 338                return ret;
 339
 340        /* XXX: 750MHz seems rather arbitrary */
 341        if (freq <= 750000) {
 342                r100da0 = 0x00000010;
 343                r004008 = 0x90000000;
 344        } else {
 345                r100da0 = 0x00000000;
 346                r004008 = 0x80000000;
 347        }
 348
 349        r004008 |= (mpll.bias_p << 19) | (P << 22) | (P << 16);
 350
 351        ram_mask(hwsq, 0x00c040, 0xc000c000, 0x0000c000);
 352        /* XXX: Is rammap_00_16_40 the DLL bit we've seen in GT215? Why does
 353         * it have a different rammap bit from DLLoff? */
 354        ram_mask(hwsq, 0x004008, 0x00004200, 0x00000200 |
 355                        next->bios.rammap_00_16_40 << 14);
 356        ram_mask(hwsq, 0x00400c, 0x0000ffff, (N1 << 8) | M1);
 357        ram_mask(hwsq, 0x004008, 0x91ff0000, r004008);
 358
 359        /* XXX: GDDR3 only? */
 360        if (subdev->device->chipset >= 0x92)
 361                ram_wr32(hwsq, 0x100da0, r100da0);
 362
 363        nv50_ram_gpio(hwsq, 0x18, !next->bios.ramcfg_FBVDDQ);
 364        ram_nsec(hwsq, 64000); /*XXX*/
 365        ram_nsec(hwsq, 32000); /*XXX*/
 366
 367        ram_mask(hwsq, 0x004008, 0x00002200, 0x00002000);
 368
 369        ram_wr32(hwsq, 0x1002dc, 0x00000000); /* disable self-refresh */
 370        ram_wr32(hwsq, 0x1002d4, 0x00000001); /* disable self-refresh */
 371        ram_wr32(hwsq, 0x100210, 0x80000000); /* enable auto-refresh */
 372
 373        ram_nsec(hwsq, 12000);
 374
 375        switch (ram->base.type) {
 376        case NVKM_RAM_TYPE_DDR2:
 377                ram_nuke(hwsq, mr[0]); /* force update */
 378                ram_mask(hwsq, mr[0], 0x000, 0x000);
 379                break;
 380        case NVKM_RAM_TYPE_GDDR3:
 381                ram_nuke(hwsq, mr[1]); /* force update */
 382                ram_wr32(hwsq, mr[1], ram->base.mr[1]);
 383                ram_nuke(hwsq, mr[0]); /* force update */
 384                ram_wr32(hwsq, mr[0], ram->base.mr[0]);
 385                break;
 386        default:
 387                break;
 388        }
 389
 390        ram_mask(hwsq, timing[3], 0xffffffff, timing[3]);
 391        ram_mask(hwsq, timing[1], 0xffffffff, timing[1]);
 392        ram_mask(hwsq, timing[6], 0xffffffff, timing[6]);
 393        ram_mask(hwsq, timing[7], 0xffffffff, timing[7]);
 394        ram_mask(hwsq, timing[8], 0xffffffff, timing[8]);
 395        ram_mask(hwsq, timing[0], 0xffffffff, timing[0]);
 396        ram_mask(hwsq, timing[2], 0xffffffff, timing[2]);
 397        ram_mask(hwsq, timing[4], 0xffffffff, timing[4]);
 398        ram_mask(hwsq, timing[5], 0xffffffff, timing[5]);
 399
 400        if (!next->bios.ramcfg_00_03_02)
 401                ram_mask(hwsq, 0x10021c, 0x00010000, 0x00000000);
 402        ram_mask(hwsq, 0x100200, 0x00001000, !next->bios.ramcfg_00_04_02 << 12);
 403
 404        /* XXX: A lot of this could be "chipset"/"ram type" specific stuff */
 405        unk710  = ram_rd32(hwsq, 0x100710) & ~0x00000100;
 406        unk714  = ram_rd32(hwsq, 0x100714) & ~0xf0000020;
 407        unk718  = ram_rd32(hwsq, 0x100718) & ~0x00000100;
 408        unk71c  = ram_rd32(hwsq, 0x10071c) & ~0x00000100;
 409        if (subdev->device->chipset <= 0x96) {
 410                unk710 &= ~0x0000006e;
 411                unk714 &= ~0x00000100;
 412
 413                if (!next->bios.ramcfg_00_03_08)
 414                        unk710 |= 0x00000060;
 415                if (!next->bios.ramcfg_FBVDDQ)
 416                        unk714 |= 0x00000100;
 417                if ( next->bios.ramcfg_00_04_04)
 418                        unk710 |= 0x0000000e;
 419        } else {
 420                unk710 &= ~0x00000001;
 421
 422                if (!next->bios.ramcfg_00_03_08)
 423                        unk710 |= 0x00000001;
 424        }
 425
 426        if ( next->bios.ramcfg_00_03_01)
 427                unk71c |= 0x00000100;
 428        if ( next->bios.ramcfg_00_03_02)
 429                unk710 |= 0x00000100;
 430        if (!next->bios.ramcfg_00_03_08)
 431                unk714 |= 0x00000020;
 432        if ( next->bios.ramcfg_00_04_04)
 433                unk714 |= 0x70000000;
 434        if ( next->bios.ramcfg_00_04_20)
 435                unk718 |= 0x00000100;
 436
 437        ram_mask(hwsq, 0x100714, 0xffffffff, unk714);
 438        ram_mask(hwsq, 0x10071c, 0xffffffff, unk71c);
 439        ram_mask(hwsq, 0x100718, 0xffffffff, unk718);
 440        ram_mask(hwsq, 0x100710, 0xffffffff, unk710);
 441
 442        /* XXX: G94 does not even test these regs in trace. Harmless we do it,
 443         * but why is it omitted? */
 444        if (next->bios.rammap_00_16_20) {
 445                ram_wr32(hwsq, 0x1005a0, next->bios.ramcfg_00_07 << 16 |
 446                                         next->bios.ramcfg_00_06 << 8 |
 447                                         next->bios.ramcfg_00_05);
 448                ram_wr32(hwsq, 0x1005a4, next->bios.ramcfg_00_09 << 8 |
 449                                         next->bios.ramcfg_00_08);
 450                ram_mask(hwsq, 0x10053c, 0x00001000, 0x00000000);
 451        } else {
 452                ram_mask(hwsq, 0x10053c, 0x00001000, 0x00001000);
 453        }
 454        ram_mask(hwsq, mr[1], 0xffffffff, ram->base.mr[1]);
 455
 456        if (!next->bios.timing_10_ODT)
 457                nv50_ram_gpio(hwsq, 0x2e, 0);
 458
 459        /* Reset DLL */
 460        if (!next->bios.ramcfg_DLLoff)
 461                nvkm_sddr2_dll_reset(hwsq);
 462
 463        ram_setf(hwsq, 0x10, 0x01); /* enable fb */
 464        ram_wait(hwsq, 0x00, 0x00); /* wait for fb enabled */
 465        ram_wr32(hwsq, 0x611200, 0x00003330);
 466        ram_wr32(hwsq, 0x002504, 0x00000000); /* un-block fifo */
 467
 468        if (next->bios.rammap_00_17_02)
 469                ram_mask(hwsq, 0x100200, 0x00000800, 0x00000800);
 470        if (!next->bios.rammap_00_16_40)
 471                ram_mask(hwsq, 0x004008, 0x00004000, 0x00000000);
 472        if (next->bios.ramcfg_00_03_02)
 473                ram_mask(hwsq, 0x10021c, 0x00010000, 0x00010000);
 474        if (subdev->device->chipset <= 0x96 && next->bios.ramcfg_00_03_02)
 475                ram_mask(hwsq, 0x100710, 0x00000200, 0x00000200);
 476
 477        return 0;
 478}
 479
 480static int
 481nv50_ram_prog(struct nvkm_ram *base)
 482{
 483        struct nv50_ram *ram = nv50_ram(base);
 484        struct nvkm_device *device = ram->base.fb->subdev.device;
 485        ram_exec(&ram->hwsq, nvkm_boolopt(device->cfgopt, "NvMemExec", true));
 486        return 0;
 487}
 488
 489static void
 490nv50_ram_tidy(struct nvkm_ram *base)
 491{
 492        struct nv50_ram *ram = nv50_ram(base);
 493        ram_exec(&ram->hwsq, false);
 494}
 495
 496void
 497__nv50_ram_put(struct nvkm_ram *ram, struct nvkm_mem *mem)
 498{
 499        struct nvkm_mm_node *this;
 500
 501        while (!list_empty(&mem->regions)) {
 502                this = list_first_entry(&mem->regions, typeof(*this), rl_entry);
 503
 504                list_del(&this->rl_entry);
 505                nvkm_mm_free(&ram->vram, &this);
 506        }
 507
 508        nvkm_mm_free(&ram->tags, &mem->tag);
 509}
 510
 511void
 512nv50_ram_put(struct nvkm_ram *ram, struct nvkm_mem **pmem)
 513{
 514        struct nvkm_mem *mem = *pmem;
 515
 516        *pmem = NULL;
 517        if (unlikely(mem == NULL))
 518                return;
 519
 520        mutex_lock(&ram->fb->subdev.mutex);
 521        __nv50_ram_put(ram, mem);
 522        mutex_unlock(&ram->fb->subdev.mutex);
 523
 524        kfree(mem);
 525}
 526
 527int
 528nv50_ram_get(struct nvkm_ram *ram, u64 size, u32 align, u32 ncmin,
 529             u32 memtype, struct nvkm_mem **pmem)
 530{
 531        struct nvkm_mm *heap = &ram->vram;
 532        struct nvkm_mm *tags = &ram->tags;
 533        struct nvkm_mm_node *r;
 534        struct nvkm_mem *mem;
 535        int comp = (memtype & 0x300) >> 8;
 536        int type = (memtype & 0x07f);
 537        int back = (memtype & 0x800);
 538        int min, max, ret;
 539
 540        max = (size >> NVKM_RAM_MM_SHIFT);
 541        min = ncmin ? (ncmin >> NVKM_RAM_MM_SHIFT) : max;
 542        align >>= NVKM_RAM_MM_SHIFT;
 543
 544        mem = kzalloc(sizeof(*mem), GFP_KERNEL);
 545        if (!mem)
 546                return -ENOMEM;
 547
 548        mutex_lock(&ram->fb->subdev.mutex);
 549        if (comp) {
 550                if (align == (1 << (16 - NVKM_RAM_MM_SHIFT))) {
 551                        int n = (max >> 4) * comp;
 552
 553                        ret = nvkm_mm_head(tags, 0, 1, n, n, 1, &mem->tag);
 554                        if (ret)
 555                                mem->tag = NULL;
 556                }
 557
 558                if (unlikely(!mem->tag))
 559                        comp = 0;
 560        }
 561
 562        INIT_LIST_HEAD(&mem->regions);
 563        mem->memtype = (comp << 7) | type;
 564        mem->size = max;
 565
 566        type = nv50_fb_memtype[type];
 567        do {
 568                if (back)
 569                        ret = nvkm_mm_tail(heap, 0, type, max, min, align, &r);
 570                else
 571                        ret = nvkm_mm_head(heap, 0, type, max, min, align, &r);
 572                if (ret) {
 573                        mutex_unlock(&ram->fb->subdev.mutex);
 574                        ram->func->put(ram, &mem);
 575                        return ret;
 576                }
 577
 578                list_add_tail(&r->rl_entry, &mem->regions);
 579                max -= r->length;
 580        } while (max);
 581        mutex_unlock(&ram->fb->subdev.mutex);
 582
 583        r = list_first_entry(&mem->regions, struct nvkm_mm_node, rl_entry);
 584        mem->offset = (u64)r->offset << NVKM_RAM_MM_SHIFT;
 585        *pmem = mem;
 586        return 0;
 587}
 588
 589static const struct nvkm_ram_func
 590nv50_ram_func = {
 591        .get = nv50_ram_get,
 592        .put = nv50_ram_put,
 593        .calc = nv50_ram_calc,
 594        .prog = nv50_ram_prog,
 595        .tidy = nv50_ram_tidy,
 596};
 597
 598static u32
 599nv50_fb_vram_rblock(struct nvkm_ram *ram)
 600{
 601        struct nvkm_subdev *subdev = &ram->fb->subdev;
 602        struct nvkm_device *device = subdev->device;
 603        int colbits, rowbitsa, rowbitsb, banks;
 604        u64 rowsize, predicted;
 605        u32 r0, r4, rt, rblock_size;
 606
 607        r0 = nvkm_rd32(device, 0x100200);
 608        r4 = nvkm_rd32(device, 0x100204);
 609        rt = nvkm_rd32(device, 0x100250);
 610        nvkm_debug(subdev, "memcfg %08x %08x %08x %08x\n",
 611                   r0, r4, rt, nvkm_rd32(device, 0x001540));
 612
 613        colbits  =  (r4 & 0x0000f000) >> 12;
 614        rowbitsa = ((r4 & 0x000f0000) >> 16) + 8;
 615        rowbitsb = ((r4 & 0x00f00000) >> 20) + 8;
 616        banks    = 1 << (((r4 & 0x03000000) >> 24) + 2);
 617
 618        rowsize = ram->parts * banks * (1 << colbits) * 8;
 619        predicted = rowsize << rowbitsa;
 620        if (r0 & 0x00000004)
 621                predicted += rowsize << rowbitsb;
 622
 623        if (predicted != ram->size) {
 624                nvkm_warn(subdev, "memory controller reports %d MiB VRAM\n",
 625                          (u32)(ram->size >> 20));
 626        }
 627
 628        rblock_size = rowsize;
 629        if (rt & 1)
 630                rblock_size *= 3;
 631
 632        nvkm_debug(subdev, "rblock %d bytes\n", rblock_size);
 633        return rblock_size;
 634}
 635
 636int
 637nv50_ram_ctor(const struct nvkm_ram_func *func,
 638              struct nvkm_fb *fb, struct nvkm_ram *ram)
 639{
 640        struct nvkm_device *device = fb->subdev.device;
 641        struct nvkm_bios *bios = device->bios;
 642        const u32 rsvd_head = ( 256 * 1024); /* vga memory */
 643        const u32 rsvd_tail = (1024 * 1024); /* vbios etc */
 644        u64 size = nvkm_rd32(device, 0x10020c);
 645        u32 tags = nvkm_rd32(device, 0x100320);
 646        enum nvkm_ram_type type = NVKM_RAM_TYPE_UNKNOWN;
 647        int ret;
 648
 649        switch (nvkm_rd32(device, 0x100714) & 0x00000007) {
 650        case 0: type = NVKM_RAM_TYPE_DDR1; break;
 651        case 1:
 652                if (nvkm_fb_bios_memtype(bios) == NVKM_RAM_TYPE_DDR3)
 653                        type = NVKM_RAM_TYPE_DDR3;
 654                else
 655                        type = NVKM_RAM_TYPE_DDR2;
 656                break;
 657        case 2: type = NVKM_RAM_TYPE_GDDR3; break;
 658        case 3: type = NVKM_RAM_TYPE_GDDR4; break;
 659        case 4: type = NVKM_RAM_TYPE_GDDR5; break;
 660        default:
 661                break;
 662        }
 663
 664        size = (size & 0x000000ff) << 32 | (size & 0xffffff00);
 665
 666        ret = nvkm_ram_ctor(func, fb, type, size, tags, ram);
 667        if (ret)
 668                return ret;
 669
 670        ram->part_mask = (nvkm_rd32(device, 0x001540) & 0x00ff0000) >> 16;
 671        ram->parts = hweight8(ram->part_mask);
 672        ram->ranks = (nvkm_rd32(device, 0x100200) & 0x4) ? 2 : 1;
 673        nvkm_mm_fini(&ram->vram);
 674
 675        return nvkm_mm_init(&ram->vram, rsvd_head >> NVKM_RAM_MM_SHIFT,
 676                            (size - rsvd_head - rsvd_tail) >> NVKM_RAM_MM_SHIFT,
 677                            nv50_fb_vram_rblock(ram) >> NVKM_RAM_MM_SHIFT);
 678}
 679
 680int
 681nv50_ram_new(struct nvkm_fb *fb, struct nvkm_ram **pram)
 682{
 683        struct nv50_ram *ram;
 684        int ret, i;
 685
 686        if (!(ram = kzalloc(sizeof(*ram), GFP_KERNEL)))
 687                return -ENOMEM;
 688        *pram = &ram->base;
 689
 690        ret = nv50_ram_ctor(&nv50_ram_func, fb, &ram->base);
 691        if (ret)
 692                return ret;
 693
 694        ram->hwsq.r_0x002504 = hwsq_reg(0x002504);
 695        ram->hwsq.r_0x00c040 = hwsq_reg(0x00c040);
 696        ram->hwsq.r_0x004008 = hwsq_reg(0x004008);
 697        ram->hwsq.r_0x00400c = hwsq_reg(0x00400c);
 698        ram->hwsq.r_0x100200 = hwsq_reg(0x100200);
 699        ram->hwsq.r_0x100210 = hwsq_reg(0x100210);
 700        ram->hwsq.r_0x10021c = hwsq_reg(0x10021c);
 701        ram->hwsq.r_0x1002d0 = hwsq_reg(0x1002d0);
 702        ram->hwsq.r_0x1002d4 = hwsq_reg(0x1002d4);
 703        ram->hwsq.r_0x1002dc = hwsq_reg(0x1002dc);
 704        ram->hwsq.r_0x10053c = hwsq_reg(0x10053c);
 705        ram->hwsq.r_0x1005a0 = hwsq_reg(0x1005a0);
 706        ram->hwsq.r_0x1005a4 = hwsq_reg(0x1005a4);
 707        ram->hwsq.r_0x100710 = hwsq_reg(0x100710);
 708        ram->hwsq.r_0x100714 = hwsq_reg(0x100714);
 709        ram->hwsq.r_0x100718 = hwsq_reg(0x100718);
 710        ram->hwsq.r_0x10071c = hwsq_reg(0x10071c);
 711        ram->hwsq.r_0x100da0 = hwsq_stride(0x100da0, 4, ram->base.part_mask);
 712        ram->hwsq.r_0x100e20 = hwsq_reg(0x100e20);
 713        ram->hwsq.r_0x100e24 = hwsq_reg(0x100e24);
 714        ram->hwsq.r_0x611200 = hwsq_reg(0x611200);
 715
 716        for (i = 0; i < 9; i++)
 717                ram->hwsq.r_timing[i] = hwsq_reg(0x100220 + (i * 0x04));
 718
 719        if (ram->base.ranks > 1) {
 720                ram->hwsq.r_mr[0] = hwsq_reg2(0x1002c0, 0x1002c8);
 721                ram->hwsq.r_mr[1] = hwsq_reg2(0x1002c4, 0x1002cc);
 722                ram->hwsq.r_mr[2] = hwsq_reg2(0x1002e0, 0x1002e8);
 723                ram->hwsq.r_mr[3] = hwsq_reg2(0x1002e4, 0x1002ec);
 724        } else {
 725                ram->hwsq.r_mr[0] = hwsq_reg(0x1002c0);
 726                ram->hwsq.r_mr[1] = hwsq_reg(0x1002c4);
 727                ram->hwsq.r_mr[2] = hwsq_reg(0x1002e0);
 728                ram->hwsq.r_mr[3] = hwsq_reg(0x1002e4);
 729        }
 730
 731        ram->hwsq.r_gpio[0] = hwsq_reg(0x00e104);
 732        ram->hwsq.r_gpio[1] = hwsq_reg(0x00e108);
 733        ram->hwsq.r_gpio[2] = hwsq_reg(0x00e120);
 734        ram->hwsq.r_gpio[3] = hwsq_reg(0x00e124);
 735
 736        return 0;
 737}
 738