linux/drivers/gpu/drm/etnaviv/etnaviv_buffer.c
// SPDX-License-Identifier: GPL-2.0
/*
 * Copyright (C) 2014-2018 Etnaviv Project
 */

#include <drm/drm_drv.h>

#include "etnaviv_cmdbuf.h"
#include "etnaviv_gpu.h"
#include "etnaviv_gem.h"
#include "etnaviv_mmu.h"

#include "common.xml.h"
#include "state.xml.h"
#include "state_hi.xml.h"
#include "state_3d.xml.h"
#include "cmdstream.xml.h"

/*
 * Command Buffer helper:
 */

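/*
 * Emit one 32-bit word into the kernel ring buffer and advance the write
 * position.  Callers must have reserved enough space beforehand; the
 * BUG_ON catches overruns of the buffer.
 */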
static inline void OUT(struct etnaviv_cmdbuf *buffer, u32 data)
{
        u32 *vaddr = (u32 *)buffer->vaddr;

        BUG_ON(buffer->user_size >= buffer->size);

        vaddr[buffer->user_size / 4] = data;
        buffer->user_size += 4;
}

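/*
 * Every FE command starts on a 64-bit boundary: a header word carrying
 * the opcode, followed by operand words depending on the opcode.
 * LOAD_STATE writes 'value' into the state register at address 'reg',
 * with the register offset encoded in the header in 32-bit word units.
 */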
static inline void CMD_LOAD_STATE(struct etnaviv_cmdbuf *buffer,
        u32 reg, u32 value)
{
        u32 index = reg >> VIV_FE_LOAD_STATE_HEADER_OFFSET__SHR;

        buffer->user_size = ALIGN(buffer->user_size, 8);

        /* write a register via cmd stream */
        OUT(buffer, VIV_FE_LOAD_STATE_HEADER_OP_LOAD_STATE |
                    VIV_FE_LOAD_STATE_HEADER_COUNT(1) |
                    VIV_FE_LOAD_STATE_HEADER_OFFSET(index));
        OUT(buffer, value);
}

static inline void CMD_END(struct etnaviv_cmdbuf *buffer)
{
        buffer->user_size = ALIGN(buffer->user_size, 8);

        OUT(buffer, VIV_FE_END_HEADER_OP_END);
}

static inline void CMD_WAIT(struct etnaviv_cmdbuf *buffer)
{
        buffer->user_size = ALIGN(buffer->user_size, 8);

        /* the low bits of the WAIT header hold the delay, here 200 cycles */
        OUT(buffer, VIV_FE_WAIT_HEADER_OP_WAIT | 200);
}

static inline void CMD_LINK(struct etnaviv_cmdbuf *buffer,
        u16 prefetch, u32 address)
{
        buffer->user_size = ALIGN(buffer->user_size, 8);

        /* 'prefetch' is the number of 64-bit words to fetch at 'address' */
        OUT(buffer, VIV_FE_LINK_HEADER_OP_LINK |
                    VIV_FE_LINK_HEADER_PREFETCH(prefetch));
        OUT(buffer, address);
}

static inline void CMD_STALL(struct etnaviv_cmdbuf *buffer,
        u32 from, u32 to)
{
        buffer->user_size = ALIGN(buffer->user_size, 8);

        OUT(buffer, VIV_FE_STALL_HEADER_OP_STALL);
        OUT(buffer, VIV_FE_STALL_TOKEN_FROM(from) | VIV_FE_STALL_TOKEN_TO(to));
}

/* a CMD_SEM/CMD_STALL pair makes 'from' wait until 'to' has caught up */
static inline void CMD_SEM(struct etnaviv_cmdbuf *buffer, u32 from, u32 to)
{
        CMD_LOAD_STATE(buffer, VIVS_GL_SEMAPHORE_TOKEN,
                       VIVS_GL_SEMAPHORE_TOKEN_FROM(from) |
                       VIVS_GL_SEMAPHORE_TOKEN_TO(to));
}

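/*
 * Emit the commands to switch the FE between the 2D and 3D pipe,
 * flushing the relevant PE caches of the pipe we are leaving before
 * the switch takes effect.
 */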
static void etnaviv_cmd_select_pipe(struct etnaviv_gpu *gpu,
        struct etnaviv_cmdbuf *buffer, u8 pipe)
{
        u32 flush = 0;

        lockdep_assert_held(&gpu->lock);

        /*
         * This assumes that if we're switching to 2D, we're switching
         * away from 3D, and vice versa.  Hence, if we're switching to
         * the 2D core, we need to flush the 3D depth and color caches,
         * otherwise we need to flush the 2D pixel engine cache.
         */
        if (gpu->exec_state == ETNA_PIPE_2D)
                flush = VIVS_GL_FLUSH_CACHE_PE2D;
        else if (gpu->exec_state == ETNA_PIPE_3D)
                flush = VIVS_GL_FLUSH_CACHE_DEPTH | VIVS_GL_FLUSH_CACHE_COLOR;

        CMD_LOAD_STATE(buffer, VIVS_GL_FLUSH_CACHE, flush);
        /* wait for the flush to complete before switching pipes */
        CMD_SEM(buffer, SYNC_RECIPIENT_FE, SYNC_RECIPIENT_PE);
        CMD_STALL(buffer, SYNC_RECIPIENT_FE, SYNC_RECIPIENT_PE);

        CMD_LOAD_STATE(buffer, VIVS_GL_PIPE_SELECT,
                       VIVS_GL_PIPE_SELECT_PIPE(pipe));
}

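/* Dump 'len' 32-bit words of a command buffer starting at 'off', for debugging. */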
static void etnaviv_buffer_dump(struct etnaviv_gpu *gpu,
        struct etnaviv_cmdbuf *buf, u32 off, u32 len)
{
        u32 size = buf->size;
        u32 *ptr = buf->vaddr + off;

        dev_info(gpu->dev, "virt %p phys 0x%08x free 0x%08x\n",
                        ptr, etnaviv_cmdbuf_get_va(buf,
                        &gpu->mmu_context->cmdbuf_mapping) +
                        off, size - len * 4 - off);

        print_hex_dump(KERN_INFO, "cmd ", DUMP_PREFIX_OFFSET, 16, 4,
                        ptr, len * 4, 0);
}

/*
 * Safely replace the WAIT of a waitlink with a new command and argument.
 * The GPU may be executing this WAIT while we're modifying it, so we have
 * to write it in a specific order to avoid the GPU branching to somewhere
 * else.  'wl_offset' is the offset to the first byte of the WAIT command.
 */
static void etnaviv_buffer_replace_wait(struct etnaviv_cmdbuf *buffer,
        unsigned int wl_offset, u32 cmd, u32 arg)
{
        u32 *lw = buffer->vaddr + wl_offset;

        /*
         * Write the argument word first: as long as the first word still
         * holds the single-word WAIT opcode, the second word is dead
         * padding that the FE ignores.  Only then flip the WAIT into the
         * new command, which makes both words live atomically.
         */
        lw[1] = arg;
        mb();
        lw[0] = cmd;
        mb();
}

/*
 * Ensure that there is space in the command buffer to contiguously write
 * 'cmd_dwords' 64-bit words into the buffer, wrapping back to the start
 * of the ring if necessary.  Returns the GPU address at which the next
 * command will be written.
 */
static u32 etnaviv_buffer_reserve(struct etnaviv_gpu *gpu,
        struct etnaviv_cmdbuf *buffer, unsigned int cmd_dwords)
{
        if (buffer->user_size + cmd_dwords * sizeof(u64) > buffer->size)
                buffer->user_size = 0;

        return etnaviv_cmdbuf_get_va(buffer,
                                     &gpu->mmu_context->cmdbuf_mapping) +
               buffer->user_size;
}

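/*
 * The kernel ring buffer is kept alive with a WAIT/LINK pair: the FE
 * executes the WAIT, follows the LINK straight back to that same WAIT,
 * and spins there until the kernel patches the WAIT into a LINK to new
 * work (see etnaviv_buffer_replace_wait() above):
 *
 *      +---------------+
 *      v               |
 *    WAIT 200  -->  LINK
 *
 * The value returned here is the length of this sequence in 64-bit
 * words, which the caller uses as the prefetch count when starting
 * the FE.
 */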
u16 etnaviv_buffer_init(struct etnaviv_gpu *gpu)
{
        struct etnaviv_cmdbuf *buffer = &gpu->buffer;

        lockdep_assert_held(&gpu->lock);

        /* initialize buffer */
        buffer->user_size = 0;

        CMD_WAIT(buffer);
        /* link back to the WAIT just emitted, forming the idle loop */
        CMD_LINK(buffer, 2,
                 etnaviv_cmdbuf_get_va(buffer, &gpu->mmu_context->cmdbuf_mapping)
                 + buffer->user_size - 4);

        return buffer->user_size / 8;
}

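/*
 * Build a one-shot command stream that points the MMUv2 at the master
 * TLB ('mtlb_addr') and programs the safe (scratch) address, once for
 * each pipe present on this GPU.  Returns the stream length in 64-bit
 * words for FE prefetch.
 */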
u16 etnaviv_buffer_config_mmuv2(struct etnaviv_gpu *gpu, u32 mtlb_addr, u32 safe_addr)
{
        struct etnaviv_cmdbuf *buffer = &gpu->buffer;

        lockdep_assert_held(&gpu->lock);

        buffer->user_size = 0;

        if (gpu->identity.features & chipFeatures_PIPE_3D) {
                CMD_LOAD_STATE(buffer, VIVS_GL_PIPE_SELECT,
                               VIVS_GL_PIPE_SELECT_PIPE(ETNA_PIPE_3D));
                CMD_LOAD_STATE(buffer, VIVS_MMUv2_CONFIGURATION,
                        mtlb_addr | VIVS_MMUv2_CONFIGURATION_MODE_MODE4_K);
                CMD_LOAD_STATE(buffer, VIVS_MMUv2_SAFE_ADDRESS, safe_addr);
                CMD_SEM(buffer, SYNC_RECIPIENT_FE, SYNC_RECIPIENT_PE);
                CMD_STALL(buffer, SYNC_RECIPIENT_FE, SYNC_RECIPIENT_PE);
        }

        if (gpu->identity.features & chipFeatures_PIPE_2D) {
                CMD_LOAD_STATE(buffer, VIVS_GL_PIPE_SELECT,
                               VIVS_GL_PIPE_SELECT_PIPE(ETNA_PIPE_2D));
                CMD_LOAD_STATE(buffer, VIVS_MMUv2_CONFIGURATION,
                        mtlb_addr | VIVS_MMUv2_CONFIGURATION_MODE_MODE4_K);
                CMD_LOAD_STATE(buffer, VIVS_MMUv2_SAFE_ADDRESS, safe_addr);
                CMD_SEM(buffer, SYNC_RECIPIENT_FE, SYNC_RECIPIENT_PE);
                CMD_STALL(buffer, SYNC_RECIPIENT_FE, SYNC_RECIPIENT_PE);
        }

        CMD_END(buffer);

        buffer->user_size = ALIGN(buffer->user_size, 8);

        return buffer->user_size / 8;
}

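/*
 * Build a one-shot command stream that selects entry 'id' in the MMUv2
 * page table array, as used in kernel security mode (ETNA_SEC_KERNEL).
 * Returns the stream length in 64-bit words for FE prefetch.
 */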
u16 etnaviv_buffer_config_pta(struct etnaviv_gpu *gpu, unsigned short id)
{
        struct etnaviv_cmdbuf *buffer = &gpu->buffer;

        lockdep_assert_held(&gpu->lock);

        buffer->user_size = 0;

        CMD_LOAD_STATE(buffer, VIVS_MMUv2_PTA_CONFIG,
                       VIVS_MMUv2_PTA_CONFIG_INDEX(id));

        CMD_END(buffer);

        buffer->user_size = ALIGN(buffer->user_size, 8);

        return buffer->user_size / 8;
}

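/*
 * Tear down the ring: once the queued work has drained, either LINK to
 * a final cache flush followed by an END, or, if no flush is needed,
 * turn the ring's WAIT directly into an END to stop the FE.
 */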
void etnaviv_buffer_end(struct etnaviv_gpu *gpu)
{
        struct etnaviv_cmdbuf *buffer = &gpu->buffer;
        /* the ring always ends with a 16 byte WAIT/LINK pair */
        unsigned int waitlink_offset = buffer->user_size - 16;
        u32 link_target, flush = 0;

        lockdep_assert_held(&gpu->lock);

        if (gpu->exec_state == ETNA_PIPE_2D)
                flush = VIVS_GL_FLUSH_CACHE_PE2D;
        else if (gpu->exec_state == ETNA_PIPE_3D)
                flush = VIVS_GL_FLUSH_CACHE_DEPTH |
                        VIVS_GL_FLUSH_CACHE_COLOR |
                        VIVS_GL_FLUSH_CACHE_TEXTURE |
                        VIVS_GL_FLUSH_CACHE_TEXTUREVS |
                        VIVS_GL_FLUSH_CACHE_SHADER_L2;

        if (flush) {
                /* 2 sem/stall pairs + cache flush + TS flush + END */
                unsigned int dwords = 7;

                link_target = etnaviv_buffer_reserve(gpu, buffer, dwords);

                CMD_SEM(buffer, SYNC_RECIPIENT_FE, SYNC_RECIPIENT_PE);
                CMD_STALL(buffer, SYNC_RECIPIENT_FE, SYNC_RECIPIENT_PE);
                CMD_LOAD_STATE(buffer, VIVS_GL_FLUSH_CACHE, flush);
                if (gpu->exec_state == ETNA_PIPE_3D)
                        CMD_LOAD_STATE(buffer, VIVS_TS_FLUSH_CACHE,
                                       VIVS_TS_FLUSH_CACHE_FLUSH);
                CMD_SEM(buffer, SYNC_RECIPIENT_FE, SYNC_RECIPIENT_PE);
                CMD_STALL(buffer, SYNC_RECIPIENT_FE, SYNC_RECIPIENT_PE);
                CMD_END(buffer);

                etnaviv_buffer_replace_wait(buffer, waitlink_offset,
                                            VIV_FE_LINK_HEADER_OP_LINK |
                                            VIV_FE_LINK_HEADER_PREFETCH(dwords),
                                            link_target);
        } else {
                /* Replace the WAIT of the last WAIT/LINK pair with an "END" command */
                etnaviv_buffer_replace_wait(buffer, waitlink_offset,
                                            VIV_FE_END_HEADER_OP_END, 0);
        }
}

/*
 * Append a 'sync point' to the ring buffer: signal an event, then stop
 * the FE with an END so the kernel can process the sync point; a fresh
 * WAIT/LINK pair is appended for resuming the FE afterwards.
 */
void etnaviv_sync_point_queue(struct etnaviv_gpu *gpu, unsigned int event)
{
        struct etnaviv_cmdbuf *buffer = &gpu->buffer;
        unsigned int waitlink_offset = buffer->user_size - 16;
        u32 dwords, target;

        lockdep_assert_held(&gpu->lock);

        /*
         * We need at most 4 dwords in the return target:
         * 1 event + 1 end + 1 wait + 1 link.
         */
        dwords = 4;
        target = etnaviv_buffer_reserve(gpu, buffer, dwords);

        /* Signal sync point event */
        CMD_LOAD_STATE(buffer, VIVS_GL_EVENT, VIVS_GL_EVENT_EVENT_ID(event) |
                       VIVS_GL_EVENT_FROM_PE);

        /* Stop the FE to 'pause' the GPU */
        CMD_END(buffer);

        /* Append waitlink */
        CMD_WAIT(buffer);
        CMD_LINK(buffer, 2,
                 etnaviv_cmdbuf_get_va(buffer, &gpu->mmu_context->cmdbuf_mapping)
                 + buffer->user_size - 4);

        /*
         * Kick off the 'sync point' command by replacing the previous
         * WAIT with a link to the address in the ring buffer.
         */
        etnaviv_buffer_replace_wait(buffer, waitlink_offset,
                                    VIV_FE_LINK_HEADER_OP_LINK |
                                    VIV_FE_LINK_HEADER_PREFETCH(dwords),
                                    target);
}

/*
 * Append a command buffer to the ring buffer: emit any required MMU
 * flush and pipe switch, LINK from the ring to the submitted buffer,
 * and append a LINK from that buffer back into the ring, where a cache
 * flush, completion event and a fresh WAIT/LINK pair follow.
 */
void etnaviv_buffer_queue(struct etnaviv_gpu *gpu, u32 exec_state,
        struct etnaviv_iommu_context *mmu_context, unsigned int event,
        struct etnaviv_cmdbuf *cmdbuf)
{
        struct etnaviv_cmdbuf *buffer = &gpu->buffer;
        unsigned int waitlink_offset = buffer->user_size - 16;
        u32 return_target, return_dwords;
        u32 link_target, link_dwords;
        bool switch_context = gpu->exec_state != exec_state;
        bool switch_mmu_context = gpu->mmu_context != mmu_context;
        unsigned int new_flush_seq = READ_ONCE(gpu->mmu_context->flush_seq);
        bool need_flush = switch_mmu_context || gpu->flush_seq != new_flush_seq;

        lockdep_assert_held(&gpu->lock);

        if (drm_debug & DRM_UT_DRIVER)
                etnaviv_buffer_dump(gpu, buffer, 0, 0x50);

        link_target = etnaviv_cmdbuf_get_va(cmdbuf,
                                            &gpu->mmu_context->cmdbuf_mapping);
        link_dwords = cmdbuf->size / 8;

        /*
         * If we need maintenance prior to submitting this buffer, we will
         * need to append a mmu flush load state, followed by a new
         * link to this buffer - the exact number of extra dwords is
         * computed below.
         */
        if (need_flush || switch_context) {
                u32 target, extra_dwords;

                /* link command */
                extra_dwords = 1;

                /* flush command */
                if (need_flush) {
                        if (gpu->mmu_context->global->version == ETNAVIV_IOMMU_V1)
                                extra_dwords += 1;
                        else
                                extra_dwords += 3;
                }

                /* pipe switch commands */
                if (switch_context)
                        extra_dwords += 4;

                /* PTA load command */
                if (switch_mmu_context && gpu->sec_mode == ETNA_SEC_KERNEL)
                        extra_dwords += 1;

                target = etnaviv_buffer_reserve(gpu, buffer, extra_dwords);
                /*
                 * Switch MMU context if necessary. Must be done after the
                 * link target has been calculated, as the jump forward in the
                 * kernel ring still uses the last active MMU context before
                 * the switch.
                 */
                if (switch_mmu_context) {
                        struct etnaviv_iommu_context *old_context = gpu->mmu_context;

                        etnaviv_iommu_context_get(mmu_context);
                        gpu->mmu_context = mmu_context;
                        etnaviv_iommu_context_put(old_context);
                }

                if (need_flush) {
                        /* Add the MMU flush */
                        if (gpu->mmu_context->global->version == ETNAVIV_IOMMU_V1) {
                                CMD_LOAD_STATE(buffer, VIVS_GL_FLUSH_MMU,
                                               VIVS_GL_FLUSH_MMU_FLUSH_FEMMU |
                                               VIVS_GL_FLUSH_MMU_FLUSH_UNK1 |
                                               VIVS_GL_FLUSH_MMU_FLUSH_UNK2 |
                                               VIVS_GL_FLUSH_MMU_FLUSH_PEMMU |
                                               VIVS_GL_FLUSH_MMU_FLUSH_UNK4);
                        } else {
                                u32 flush = VIVS_MMUv2_CONFIGURATION_MODE_MASK |
                                            VIVS_MMUv2_CONFIGURATION_FLUSH_FLUSH;

                                if (switch_mmu_context &&
                                    gpu->sec_mode == ETNA_SEC_KERNEL) {
                                        unsigned short id =
                                                etnaviv_iommuv2_get_pta_id(gpu->mmu_context);
                                        CMD_LOAD_STATE(buffer,
                                                VIVS_MMUv2_PTA_CONFIG,
                                                VIVS_MMUv2_PTA_CONFIG_INDEX(id));
                                }

                                if (gpu->sec_mode == ETNA_SEC_NONE)
                                        flush |= etnaviv_iommuv2_get_mtlb_addr(gpu->mmu_context);

                                CMD_LOAD_STATE(buffer, VIVS_MMUv2_CONFIGURATION,
                                               flush);
                                CMD_SEM(buffer, SYNC_RECIPIENT_FE,
                                        SYNC_RECIPIENT_PE);
                                CMD_STALL(buffer, SYNC_RECIPIENT_FE,
                                        SYNC_RECIPIENT_PE);
                        }

                        gpu->flush_seq = new_flush_seq;
                }

                if (switch_context) {
                        etnaviv_cmd_select_pipe(gpu, buffer, exec_state);
                        gpu->exec_state = exec_state;
                }

                /* And the link to the submitted buffer */
                link_target = etnaviv_cmdbuf_get_va(cmdbuf,
                                        &gpu->mmu_context->cmdbuf_mapping);
                CMD_LINK(buffer, link_dwords, link_target);

                /* Update the link target to point to above instructions */
                link_target = target;
                link_dwords = extra_dwords;
        }

        /*
         * Append a LINK to the submitted command buffer to return to
         * the ring buffer.  return_target is the ring target address.
         * We need at most 7 dwords in the return target: 2 cache flush +
         * 2 semaphore stall + 1 event + 1 wait + 1 link.
         */
        return_dwords = 7;
        return_target = etnaviv_buffer_reserve(gpu, buffer, return_dwords);
        CMD_LINK(cmdbuf, return_dwords, return_target);
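        /* The submitted buffer now ends with a LINK back into the ring. */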

        /*
         * Append a cache flush, stall, event, wait and link pointing back to
         * the wait command to the ring buffer.
         */
        if (gpu->exec_state == ETNA_PIPE_2D) {
                CMD_LOAD_STATE(buffer, VIVS_GL_FLUSH_CACHE,
                                       VIVS_GL_FLUSH_CACHE_PE2D);
        } else {
                CMD_LOAD_STATE(buffer, VIVS_GL_FLUSH_CACHE,
                                       VIVS_GL_FLUSH_CACHE_DEPTH |
                                       VIVS_GL_FLUSH_CACHE_COLOR);
                CMD_LOAD_STATE(buffer, VIVS_TS_FLUSH_CACHE,
                                       VIVS_TS_FLUSH_CACHE_FLUSH);
        }
        CMD_SEM(buffer, SYNC_RECIPIENT_FE, SYNC_RECIPIENT_PE);
        CMD_STALL(buffer, SYNC_RECIPIENT_FE, SYNC_RECIPIENT_PE);
        CMD_LOAD_STATE(buffer, VIVS_GL_EVENT, VIVS_GL_EVENT_EVENT_ID(event) |
                       VIVS_GL_EVENT_FROM_PE);
        /* the new WAIT/LINK idle loop at the end of the ring */
        CMD_WAIT(buffer);
        CMD_LINK(buffer, 2,
                 etnaviv_cmdbuf_get_va(buffer, &gpu->mmu_context->cmdbuf_mapping)
                 + buffer->user_size - 4);

        if (drm_debug & DRM_UT_DRIVER) {
                pr_info("stream link to 0x%08x @ 0x%08x %p\n",
                        return_target,
                        etnaviv_cmdbuf_get_va(cmdbuf, &gpu->mmu_context->cmdbuf_mapping),
                        cmdbuf->vaddr);

                print_hex_dump(KERN_INFO, "cmd ", DUMP_PREFIX_OFFSET, 16, 4,
                               cmdbuf->vaddr, cmdbuf->size, 0);

                pr_info("link op: %p\n", buffer->vaddr + waitlink_offset);
                pr_info("addr: 0x%08x\n", link_target);
                pr_info("back: 0x%08x\n", return_target);
                pr_info("event: %d\n", event);
        }

        /*
         * Kick off the submitted command by replacing the previous
         * WAIT with a link to the address in the ring buffer.
         */
        etnaviv_buffer_replace_wait(buffer, waitlink_offset,
                                    VIV_FE_LINK_HEADER_OP_LINK |
                                    VIV_FE_LINK_HEADER_PREFETCH(link_dwords),
                                    link_target);

        if (drm_debug & DRM_UT_DRIVER)
                etnaviv_buffer_dump(gpu, buffer, 0, 0x50);
}