linux/drivers/staging/media/hantro/rk3399_vpu_hw_mpeg2_dec.c
<<
>>
Prefs
   1// SPDX-License-Identifier: GPL-2.0
   2/*
   3 * Hantro VPU codec driver
   4 *
   5 * Copyright (C) 2018 Rockchip Electronics Co., Ltd.
   6 */
   7
   8#include <asm/unaligned.h>
   9#include <linux/bitfield.h>
  10#include <media/v4l2-mem2mem.h>
  11#include "hantro.h"
  12#include "hantro_hw.h"
  13
  14#define VDPU_SWREG(nr)                  ((nr) * 4)
  15
  16#define VDPU_REG_DEC_OUT_BASE           VDPU_SWREG(63)
  17#define VDPU_REG_RLC_VLC_BASE           VDPU_SWREG(64)
  18#define VDPU_REG_QTABLE_BASE            VDPU_SWREG(61)
  19#define VDPU_REG_REFER0_BASE            VDPU_SWREG(131)
  20#define VDPU_REG_REFER2_BASE            VDPU_SWREG(134)
  21#define VDPU_REG_REFER3_BASE            VDPU_SWREG(135)
  22#define VDPU_REG_REFER1_BASE            VDPU_SWREG(148)
  23#define VDPU_REG_DEC_E(v)               ((v) ? BIT(0) : 0)
  24
  25#define VDPU_REG_DEC_ADV_PRE_DIS(v)     ((v) ? BIT(11) : 0)
  26#define VDPU_REG_DEC_SCMD_DIS(v)        ((v) ? BIT(10) : 0)
  27#define VDPU_REG_FILTERING_DIS(v)       ((v) ? BIT(8) : 0)
  28#define VDPU_REG_DEC_LATENCY(v)         (((v) << 1) & GENMASK(6, 1))
  29
  30#define VDPU_REG_INIT_QP(v)             (((v) << 25) & GENMASK(30, 25))
  31#define VDPU_REG_STREAM_LEN(v)          (((v) << 0) & GENMASK(23, 0))
  32
  33#define VDPU_REG_APF_THRESHOLD(v)       (((v) << 17) & GENMASK(30, 17))
  34#define VDPU_REG_STARTMB_X(v)           (((v) << 8) & GENMASK(16, 8))
  35#define VDPU_REG_STARTMB_Y(v)           (((v) << 0) & GENMASK(7, 0))
  36
  37#define VDPU_REG_DEC_MODE(v)            (((v) << 0) & GENMASK(3, 0))
  38
  39#define VDPU_REG_DEC_STRENDIAN_E(v)     ((v) ? BIT(5) : 0)
  40#define VDPU_REG_DEC_STRSWAP32_E(v)     ((v) ? BIT(4) : 0)
  41#define VDPU_REG_DEC_OUTSWAP32_E(v)     ((v) ? BIT(3) : 0)
  42#define VDPU_REG_DEC_INSWAP32_E(v)      ((v) ? BIT(2) : 0)
  43#define VDPU_REG_DEC_OUT_ENDIAN(v)      ((v) ? BIT(1) : 0)
  44#define VDPU_REG_DEC_IN_ENDIAN(v)       ((v) ? BIT(0) : 0)
  45
  46#define VDPU_REG_DEC_DATA_DISC_E(v)     ((v) ? BIT(22) : 0)
  47#define VDPU_REG_DEC_MAX_BURST(v)       (((v) << 16) & GENMASK(20, 16))
  48#define VDPU_REG_DEC_AXI_WR_ID(v)       (((v) << 8) & GENMASK(15, 8))
  49#define VDPU_REG_DEC_AXI_RD_ID(v)       (((v) << 0) & GENMASK(7, 0))
  50
  51#define VDPU_REG_RLC_MODE_E(v)          ((v) ? BIT(20) : 0)
  52#define VDPU_REG_PIC_INTERLACE_E(v)     ((v) ? BIT(17) : 0)
  53#define VDPU_REG_PIC_FIELDMODE_E(v)     ((v) ? BIT(16) : 0)
  54#define VDPU_REG_PIC_B_E(v)             ((v) ? BIT(15) : 0)
  55#define VDPU_REG_PIC_INTER_E(v)         ((v) ? BIT(14) : 0)
  56#define VDPU_REG_PIC_TOPFIELD_E(v)      ((v) ? BIT(13) : 0)
  57#define VDPU_REG_FWD_INTERLACE_E(v)     ((v) ? BIT(12) : 0)
  58#define VDPU_REG_WRITE_MVS_E(v)         ((v) ? BIT(10) : 0)
  59#define VDPU_REG_DEC_TIMEOUT_E(v)       ((v) ? BIT(5) : 0)
  60#define VDPU_REG_DEC_CLK_GATE_E(v)      ((v) ? BIT(4) : 0)
  61
  62#define VDPU_REG_PIC_MB_WIDTH(v)        (((v) << 23) & GENMASK(31, 23))
  63#define VDPU_REG_PIC_MB_HEIGHT_P(v)     (((v) << 11) & GENMASK(18, 11))
  64#define VDPU_REG_ALT_SCAN_E(v)          ((v) ? BIT(6) : 0)
  65#define VDPU_REG_TOPFIELDFIRST_E(v)     ((v) ? BIT(5) : 0)
  66
  67#define VDPU_REG_STRM_START_BIT(v)      (((v) << 26) & GENMASK(31, 26))
  68#define VDPU_REG_QSCALE_TYPE(v)         ((v) ? BIT(24) : 0)
  69#define VDPU_REG_CON_MV_E(v)            ((v) ? BIT(4) : 0)
  70#define VDPU_REG_INTRA_DC_PREC(v)       (((v) << 2) & GENMASK(3, 2))
  71#define VDPU_REG_INTRA_VLC_TAB(v)       ((v) ? BIT(1) : 0)
  72#define VDPU_REG_FRAME_PRED_DCT(v)      ((v) ? BIT(0) : 0)
  73
  74#define VDPU_REG_ALT_SCAN_FLAG_E(v)     ((v) ? BIT(19) : 0)
  75#define VDPU_REG_FCODE_FWD_HOR(v)       (((v) << 15) & GENMASK(18, 15))
  76#define VDPU_REG_FCODE_FWD_VER(v)       (((v) << 11) & GENMASK(14, 11))
  77#define VDPU_REG_FCODE_BWD_HOR(v)       (((v) << 7) & GENMASK(10, 7))
  78#define VDPU_REG_FCODE_BWD_VER(v)       (((v) << 3) & GENMASK(6, 3))
  79#define VDPU_REG_MV_ACCURACY_FWD(v)     ((v) ? BIT(2) : 0)
  80#define VDPU_REG_MV_ACCURACY_BWD(v)     ((v) ? BIT(1) : 0)
  81
  82#define PICT_TOP_FIELD     1
  83#define PICT_BOTTOM_FIELD  2
  84#define PICT_FRAME         3
  85
  86static void
  87rk3399_vpu_mpeg2_dec_set_quantization(struct hantro_dev *vpu,
  88                                      struct hantro_ctx *ctx)
  89{
  90        struct v4l2_ctrl_mpeg2_quantization *quantization;
  91
  92        quantization = hantro_get_ctrl(ctx,
  93                                       V4L2_CID_MPEG_VIDEO_MPEG2_QUANTIZATION);
  94        hantro_mpeg2_dec_copy_qtable(ctx->mpeg2_dec.qtable.cpu, quantization);
  95        vdpu_write_relaxed(vpu, ctx->mpeg2_dec.qtable.dma,
  96                           VDPU_REG_QTABLE_BASE);
  97}
  98
  99static void
 100rk3399_vpu_mpeg2_dec_set_buffers(struct hantro_dev *vpu,
 101                                 struct hantro_ctx *ctx,
 102                                 struct vb2_buffer *src_buf,
 103                                 struct vb2_buffer *dst_buf,
 104                                 const struct v4l2_mpeg2_sequence *sequence,
 105                                 const struct v4l2_mpeg2_picture *picture,
 106                                 const struct v4l2_ctrl_mpeg2_slice_params *slice_params)
 107{
 108        dma_addr_t forward_addr = 0, backward_addr = 0;
 109        dma_addr_t current_addr, addr;
 110
 111        switch (picture->picture_coding_type) {
 112        case V4L2_MPEG2_PICTURE_CODING_TYPE_B:
 113                backward_addr = hantro_get_ref(ctx,
 114                                               slice_params->backward_ref_ts);
 115                fallthrough;
 116        case V4L2_MPEG2_PICTURE_CODING_TYPE_P:
 117                forward_addr = hantro_get_ref(ctx,
 118                                              slice_params->forward_ref_ts);
 119        }
 120
 121        /* Source bitstream buffer */
 122        addr = vb2_dma_contig_plane_dma_addr(src_buf, 0);
 123        vdpu_write_relaxed(vpu, addr, VDPU_REG_RLC_VLC_BASE);
 124
 125        /* Destination frame buffer */
 126        addr = vb2_dma_contig_plane_dma_addr(dst_buf, 0);
 127        current_addr = addr;
 128
 129        if (picture->picture_structure == PICT_BOTTOM_FIELD)
 130                addr += ALIGN(ctx->dst_fmt.width, 16);
 131        vdpu_write_relaxed(vpu, addr, VDPU_REG_DEC_OUT_BASE);
 132
 133        if (!forward_addr)
 134                forward_addr = current_addr;
 135        if (!backward_addr)
 136                backward_addr = current_addr;
 137
 138        /* Set forward ref frame (top/bottom field) */
 139        if (picture->picture_structure == PICT_FRAME ||
 140            picture->picture_coding_type == V4L2_MPEG2_PICTURE_CODING_TYPE_B ||
 141            (picture->picture_structure == PICT_TOP_FIELD &&
 142             picture->top_field_first) ||
 143            (picture->picture_structure == PICT_BOTTOM_FIELD &&
 144             !picture->top_field_first)) {
 145                vdpu_write_relaxed(vpu, forward_addr, VDPU_REG_REFER0_BASE);
 146                vdpu_write_relaxed(vpu, forward_addr, VDPU_REG_REFER1_BASE);
 147        } else if (picture->picture_structure == PICT_TOP_FIELD) {
 148                vdpu_write_relaxed(vpu, forward_addr, VDPU_REG_REFER0_BASE);
 149                vdpu_write_relaxed(vpu, current_addr, VDPU_REG_REFER1_BASE);
 150        } else if (picture->picture_structure == PICT_BOTTOM_FIELD) {
 151                vdpu_write_relaxed(vpu, current_addr, VDPU_REG_REFER0_BASE);
 152                vdpu_write_relaxed(vpu, forward_addr, VDPU_REG_REFER1_BASE);
 153        }
 154
 155        /* Set backward ref frame (top/bottom field) */
 156        vdpu_write_relaxed(vpu, backward_addr, VDPU_REG_REFER2_BASE);
 157        vdpu_write_relaxed(vpu, backward_addr, VDPU_REG_REFER3_BASE);
 158}
 159
 160void rk3399_vpu_mpeg2_dec_run(struct hantro_ctx *ctx)
 161{
 162        struct hantro_dev *vpu = ctx->dev;
 163        struct vb2_v4l2_buffer *src_buf, *dst_buf;
 164        const struct v4l2_ctrl_mpeg2_slice_params *slice_params;
 165        const struct v4l2_mpeg2_sequence *sequence;
 166        const struct v4l2_mpeg2_picture *picture;
 167        u32 reg;
 168
 169        src_buf = hantro_get_src_buf(ctx);
 170        dst_buf = hantro_get_dst_buf(ctx);
 171
 172        hantro_start_prepare_run(ctx);
 173
 174        slice_params = hantro_get_ctrl(ctx,
 175                                       V4L2_CID_MPEG_VIDEO_MPEG2_SLICE_PARAMS);
 176        sequence = &slice_params->sequence;
 177        picture = &slice_params->picture;
 178
 179        reg = VDPU_REG_DEC_ADV_PRE_DIS(0) |
 180              VDPU_REG_DEC_SCMD_DIS(0) |
 181              VDPU_REG_FILTERING_DIS(1) |
 182              VDPU_REG_DEC_LATENCY(0);
 183        vdpu_write_relaxed(vpu, reg, VDPU_SWREG(50));
 184
 185        reg = VDPU_REG_INIT_QP(1) |
 186              VDPU_REG_STREAM_LEN(slice_params->bit_size >> 3);
 187        vdpu_write_relaxed(vpu, reg, VDPU_SWREG(51));
 188
 189        reg = VDPU_REG_APF_THRESHOLD(8) |
 190              VDPU_REG_STARTMB_X(0) |
 191              VDPU_REG_STARTMB_Y(0);
 192        vdpu_write_relaxed(vpu, reg, VDPU_SWREG(52));
 193
 194        reg = VDPU_REG_DEC_MODE(5);
 195        vdpu_write_relaxed(vpu, reg, VDPU_SWREG(53));
 196
 197        reg = VDPU_REG_DEC_STRENDIAN_E(1) |
 198              VDPU_REG_DEC_STRSWAP32_E(1) |
 199              VDPU_REG_DEC_OUTSWAP32_E(1) |
 200              VDPU_REG_DEC_INSWAP32_E(1) |
 201              VDPU_REG_DEC_OUT_ENDIAN(1) |
 202              VDPU_REG_DEC_IN_ENDIAN(1);
 203        vdpu_write_relaxed(vpu, reg, VDPU_SWREG(54));
 204
 205        reg = VDPU_REG_DEC_DATA_DISC_E(0) |
 206              VDPU_REG_DEC_MAX_BURST(16) |
 207              VDPU_REG_DEC_AXI_WR_ID(0) |
 208              VDPU_REG_DEC_AXI_RD_ID(0);
 209        vdpu_write_relaxed(vpu, reg, VDPU_SWREG(56));
 210
 211        reg = VDPU_REG_RLC_MODE_E(0) |
 212              VDPU_REG_PIC_INTERLACE_E(!sequence->progressive_sequence) |
 213              VDPU_REG_PIC_FIELDMODE_E(picture->picture_structure != PICT_FRAME) |
 214              VDPU_REG_PIC_B_E(picture->picture_coding_type == V4L2_MPEG2_PICTURE_CODING_TYPE_B) |
 215              VDPU_REG_PIC_INTER_E(picture->picture_coding_type != V4L2_MPEG2_PICTURE_CODING_TYPE_I) |
 216              VDPU_REG_PIC_TOPFIELD_E(picture->picture_structure == PICT_TOP_FIELD) |
 217              VDPU_REG_FWD_INTERLACE_E(0) |
 218              VDPU_REG_WRITE_MVS_E(0) |
 219              VDPU_REG_DEC_TIMEOUT_E(1) |
 220              VDPU_REG_DEC_CLK_GATE_E(1);
 221        vdpu_write_relaxed(vpu, reg, VDPU_SWREG(57));
 222
 223        reg = VDPU_REG_PIC_MB_WIDTH(MB_WIDTH(ctx->dst_fmt.width)) |
 224              VDPU_REG_PIC_MB_HEIGHT_P(MB_HEIGHT(ctx->dst_fmt.height)) |
 225              VDPU_REG_ALT_SCAN_E(picture->alternate_scan) |
 226              VDPU_REG_TOPFIELDFIRST_E(picture->top_field_first);
 227        vdpu_write_relaxed(vpu, reg, VDPU_SWREG(120));
 228
 229        reg = VDPU_REG_STRM_START_BIT(slice_params->data_bit_offset) |
 230              VDPU_REG_QSCALE_TYPE(picture->q_scale_type) |
 231              VDPU_REG_CON_MV_E(picture->concealment_motion_vectors) |
 232              VDPU_REG_INTRA_DC_PREC(picture->intra_dc_precision) |
 233              VDPU_REG_INTRA_VLC_TAB(picture->intra_vlc_format) |
 234              VDPU_REG_FRAME_PRED_DCT(picture->frame_pred_frame_dct);
 235        vdpu_write_relaxed(vpu, reg, VDPU_SWREG(122));
 236
 237        reg = VDPU_REG_ALT_SCAN_FLAG_E(picture->alternate_scan) |
 238              VDPU_REG_FCODE_FWD_HOR(picture->f_code[0][0]) |
 239              VDPU_REG_FCODE_FWD_VER(picture->f_code[0][1]) |
 240              VDPU_REG_FCODE_BWD_HOR(picture->f_code[1][0]) |
 241              VDPU_REG_FCODE_BWD_VER(picture->f_code[1][1]) |
 242              VDPU_REG_MV_ACCURACY_FWD(1) |
 243              VDPU_REG_MV_ACCURACY_BWD(1);
 244        vdpu_write_relaxed(vpu, reg, VDPU_SWREG(136));
 245
 246        rk3399_vpu_mpeg2_dec_set_quantization(vpu, ctx);
 247
 248        rk3399_vpu_mpeg2_dec_set_buffers(vpu, ctx, &src_buf->vb2_buf,
 249                                         &dst_buf->vb2_buf,
 250                                         sequence, picture, slice_params);
 251
 252        /* Kick the watchdog and start decoding */
 253        hantro_end_prepare_run(ctx);
 254
 255        reg = vdpu_read(vpu, VDPU_SWREG(57)) | VDPU_REG_DEC_E(1);
 256        vdpu_write(vpu, reg, VDPU_SWREG(57));
 257}
 258