mirror of
https://github.com/Fishwaldo/build.git
synced 2025-07-17 10:28:35 +00:00
* Introducing Rockchip rk322x SoC support Main features: - Legacy kernel flavour based upon stable v2.x rk3288 Rockchip branch (https://github.com/rockchip-linux/kernel/tree/stable-4.4-rk3288-linux-v2.x) - Current kernel flavour based on mainline 5.6.y kernel - Mainline u-boot (v2020.04) - Single generic tv box target (rk322x-box) which boots on all the known tv boxes - Hardware devices (eMMC/NAND, led wiring configuration, SoC variant selection) modulation done by user at runtime via device tree overlays - a script (rk322x-config) is provided for autodetection and simple configuration by inexperienced users; - Bits added to armbian-hardware-optimization to set affinity for irq handlers - rk322x-box targets already added to targets.conf for automatic image creation * Removed disabled patches * Restored mysteriously removed comment character
1525 lines
64 KiB
Diff
1525 lines
64 KiB
Diff
diff --git a/drivers/staging/media/hantro/rk3399_vpu_hw_mpeg2_dec.c b/drivers/staging/media/hantro/rk3399_vpu_hw_mpeg2_dec.c
|
|
index 7e9aad671489..b9b8194b42f2 100644
|
|
--- a/drivers/staging/media/hantro/rk3399_vpu_hw_mpeg2_dec.c
|
|
+++ b/drivers/staging/media/hantro/rk3399_vpu_hw_mpeg2_dec.c
|
|
@@ -127,7 +127,7 @@ rk3399_vpu_mpeg2_dec_set_buffers(struct hantro_dev *vpu,
|
|
current_addr = addr;
|
|
|
|
if (picture->picture_structure == PICT_BOTTOM_FIELD)
|
|
- addr += ALIGN(ctx->dst_fmt.width, 16);
|
|
+ addr += ALIGN(ctx->src_fmt.width, MB_DIM);
|
|
vdpu_write_relaxed(vpu, addr, VDPU_REG_DEC_OUT_BASE);
|
|
|
|
if (!forward_addr)
|
|
@@ -220,8 +220,8 @@ void rk3399_vpu_mpeg2_dec_run(struct hantro_ctx *ctx)
|
|
VDPU_REG_DEC_CLK_GATE_E(1);
|
|
vdpu_write_relaxed(vpu, reg, VDPU_SWREG(57));
|
|
|
|
- reg = VDPU_REG_PIC_MB_WIDTH(MB_WIDTH(ctx->dst_fmt.width)) |
|
|
- VDPU_REG_PIC_MB_HEIGHT_P(MB_HEIGHT(ctx->dst_fmt.height)) |
|
|
+ reg = VDPU_REG_PIC_MB_WIDTH(MB_WIDTH(ctx->src_fmt.width)) |
|
|
+ VDPU_REG_PIC_MB_HEIGHT_P(MB_HEIGHT(ctx->src_fmt.height)) |
|
|
VDPU_REG_ALT_SCAN_E(picture->alternate_scan) |
|
|
VDPU_REG_TOPFIELDFIRST_E(picture->top_field_first);
|
|
vdpu_write_relaxed(vpu, reg, VDPU_SWREG(120));
|
|
--
|
|
2.17.1
|
|
|
|
|
|
From 3b87f8547b97f13afb8db289cc9974760e668b79 Mon Sep 17 00:00:00 2001
|
|
From: Jonas Karlman <jonas@kwiboo.se>
|
|
Date: Tue, 5 Nov 2019 23:06:34 +0000
|
|
Subject: [PATCH] WIP: media: hantro: g1 mpeg2 src_fmt
|
|
|
|
Fixes: ceaac6dc5b7a
|
|
Signed-off-by: Jonas Karlman <jonas@kwiboo.se>
|
|
---
|
|
drivers/staging/media/hantro/hantro_g1_mpeg2_dec.c | 6 +++---
|
|
1 file changed, 3 insertions(+), 3 deletions(-)
|
|
|
|
diff --git a/drivers/staging/media/hantro/hantro_g1_mpeg2_dec.c b/drivers/staging/media/hantro/hantro_g1_mpeg2_dec.c
|
|
index 24041849384a..44f7326aba32 100644
|
|
--- a/drivers/staging/media/hantro/hantro_g1_mpeg2_dec.c
|
|
+++ b/drivers/staging/media/hantro/hantro_g1_mpeg2_dec.c
|
|
@@ -125,7 +125,7 @@ hantro_g1_mpeg2_dec_set_buffers(struct hantro_dev *vpu, struct hantro_ctx *ctx,
|
|
current_addr = addr;
|
|
|
|
if (picture->picture_structure == PICT_BOTTOM_FIELD)
|
|
- addr += ALIGN(ctx->dst_fmt.width, 16);
|
|
+ addr += ALIGN(ctx->src_fmt.width, MB_DIM);
|
|
vdpu_write_relaxed(vpu, addr, G1_REG_DEC_OUT_BASE);
|
|
|
|
if (!forward_addr)
|
|
@@ -204,8 +204,8 @@ void hantro_g1_mpeg2_dec_run(struct hantro_ctx *ctx)
|
|
G1_REG_DEC_AXI_WR_ID(0);
|
|
vdpu_write_relaxed(vpu, reg, G1_SWREG(3));
|
|
|
|
- reg = G1_REG_PIC_MB_WIDTH(MB_WIDTH(ctx->dst_fmt.width)) |
|
|
- G1_REG_PIC_MB_HEIGHT_P(MB_HEIGHT(ctx->dst_fmt.height)) |
|
|
+ reg = G1_REG_PIC_MB_WIDTH(MB_WIDTH(ctx->src_fmt.width)) |
|
|
+ G1_REG_PIC_MB_HEIGHT_P(MB_HEIGHT(ctx->src_fmt.height)) |
|
|
G1_REG_ALT_SCAN_E(picture->alternate_scan) |
|
|
G1_REG_TOPFIELDFIRST_E(picture->top_field_first);
|
|
vdpu_write_relaxed(vpu, reg, G1_SWREG(4));
|
|
--
|
|
2.17.1
|
|
|
|
|
|
From 10bf68403975d4fe3b383c7882d6a7d8a8bca64b Mon Sep 17 00:00:00 2001
|
|
From: Jonas Karlman <jonas@kwiboo.se>
|
|
Date: Tue, 5 Nov 2019 23:09:18 +0000
|
|
Subject: [PATCH] WIP: media: hantro: vp8 src_fmt
|
|
|
|
Signed-off-by: Jonas Karlman <jonas@kwiboo.se>
|
|
---
|
|
drivers/staging/media/hantro/hantro_g1_vp8_dec.c | 4 ++--
|
|
drivers/staging/media/hantro/hantro_vp8.c | 4 ++--
|
|
drivers/staging/media/hantro/rk3399_vpu_hw_vp8_dec.c | 4 ++--
|
|
3 files changed, 6 insertions(+), 6 deletions(-)
|
|
|
|
diff --git a/drivers/staging/media/hantro/hantro_g1_vp8_dec.c b/drivers/staging/media/hantro/hantro_g1_vp8_dec.c
|
|
index a5cdf150cd16..e36538117fbf 100644
|
|
--- a/drivers/staging/media/hantro/hantro_g1_vp8_dec.c
|
|
+++ b/drivers/staging/media/hantro/hantro_g1_vp8_dec.c
|
|
@@ -430,8 +430,8 @@ void hantro_g1_vp8_dec_run(struct hantro_ctx *ctx)
|
|
{
|
|
const struct v4l2_ctrl_vp8_frame_header *hdr;
|
|
struct hantro_dev *vpu = ctx->dev;
|
|
- size_t height = ctx->dst_fmt.height;
|
|
- size_t width = ctx->dst_fmt.width;
|
|
+ size_t height = ctx->src_fmt.height;
|
|
+ size_t width = ctx->src_fmt.width;
|
|
u32 mb_width, mb_height;
|
|
u32 reg;
|
|
|
|
diff --git a/drivers/staging/media/hantro/hantro_vp8.c b/drivers/staging/media/hantro/hantro_vp8.c
|
|
index 0e02d147b189..e010c9088fde 100644
|
|
--- a/drivers/staging/media/hantro/hantro_vp8.c
|
|
+++ b/drivers/staging/media/hantro/hantro_vp8.c
|
|
@@ -151,8 +151,8 @@ int hantro_vp8_dec_init(struct hantro_ctx *ctx)
|
|
int ret;
|
|
|
|
/* segment map table size calculation */
|
|
- mb_width = DIV_ROUND_UP(ctx->dst_fmt.width, 16);
|
|
- mb_height = DIV_ROUND_UP(ctx->dst_fmt.height, 16);
|
|
+ mb_width = MB_WIDTH(ctx->src_fmt.width);
|
|
+ mb_height = MB_HEIGHT(ctx->src_fmt.height);
|
|
segment_map_size = round_up(DIV_ROUND_UP(mb_width * mb_height, 4), 64);
|
|
|
|
/*
|
|
diff --git a/drivers/staging/media/hantro/rk3399_vpu_hw_vp8_dec.c b/drivers/staging/media/hantro/rk3399_vpu_hw_vp8_dec.c
|
|
index a4a792f00b11..2f553e740294 100644
|
|
--- a/drivers/staging/media/hantro/rk3399_vpu_hw_vp8_dec.c
|
|
+++ b/drivers/staging/media/hantro/rk3399_vpu_hw_vp8_dec.c
|
|
@@ -508,8 +508,8 @@ void rk3399_vpu_vp8_dec_run(struct hantro_ctx *ctx)
|
|
{
|
|
const struct v4l2_ctrl_vp8_frame_header *hdr;
|
|
struct hantro_dev *vpu = ctx->dev;
|
|
- size_t height = ctx->dst_fmt.height;
|
|
- size_t width = ctx->dst_fmt.width;
|
|
+ size_t height = ctx->src_fmt.height;
|
|
+ size_t width = ctx->src_fmt.width;
|
|
u32 mb_width, mb_height;
|
|
u32 reg;
|
|
|
|
--
|
|
2.17.1
|
|
|
|
|
|
From 4f7561c70db7347ade627ee0aacfb45c35022195 Mon Sep 17 00:00:00 2001
|
|
From: Jonas Karlman <jonas@kwiboo.se>
|
|
Date: Sun, 18 Aug 2019 10:40:31 +0000
|
|
Subject: [PATCH] media: hantro: Refactor G1 H264 code
|
|
|
|
Use generated code from my rockchip-vpu-regtool
|
|
|
|
Code could possible need some cleanup
|
|
|
|
Signed-off-by: Jonas Karlman <jonas@kwiboo.se>
|
|
---
|
|
.../staging/media/hantro/hantro_g1_h264_dec.c | 653 +++++++++++-------
|
|
drivers/staging/media/hantro/hantro_h264.c | 14 +
|
|
drivers/staging/media/hantro/hantro_hw.h | 2 +
|
|
3 files changed, 435 insertions(+), 234 deletions(-)
|
|
|
|
diff --git a/drivers/staging/media/hantro/hantro_g1_h264_dec.c b/drivers/staging/media/hantro/hantro_g1_h264_dec.c
|
|
index 89cf5741280e..20999b005307 100644
|
|
--- a/drivers/staging/media/hantro/hantro_g1_h264_dec.c
|
|
+++ b/drivers/staging/media/hantro/hantro_g1_h264_dec.c
|
|
@@ -1,6 +1,6 @@
|
|
// SPDX-License-Identifier: GPL-2.0
|
|
/*
|
|
- * Rockchip RK3288 VPU codec driver
|
|
+ * Hantro VPU codec driver
|
|
*
|
|
* Copyright (c) 2014 Rockchip Electronics Co., Ltd.
|
|
* Hertz Wong <hertz.wong@rock-chips.com>
|
|
@@ -15,235 +15,430 @@
|
|
|
|
#include <media/v4l2-mem2mem.h>
|
|
|
|
-#include "hantro_g1_regs.h"
|
|
#include "hantro_hw.h"
|
|
#include "hantro_v4l2.h"
|
|
|
|
-static void set_params(struct hantro_ctx *ctx)
|
|
+#define G1_SWREG(nr) ((nr) * 4)
|
|
+
|
|
+#define G1_REG_RLC_VLC_BASE G1_SWREG(12)
|
|
+#define G1_REG_DEC_OUT_BASE G1_SWREG(13)
|
|
+#define G1_REG_REFER0_BASE G1_SWREG(14)
|
|
+#define G1_REG_REFER1_BASE G1_SWREG(15)
|
|
+#define G1_REG_REFER2_BASE G1_SWREG(16)
|
|
+#define G1_REG_REFER3_BASE G1_SWREG(17)
|
|
+#define G1_REG_REFER4_BASE G1_SWREG(18)
|
|
+#define G1_REG_REFER5_BASE G1_SWREG(19)
|
|
+#define G1_REG_REFER6_BASE G1_SWREG(20)
|
|
+#define G1_REG_REFER7_BASE G1_SWREG(21)
|
|
+#define G1_REG_REFER8_BASE G1_SWREG(22)
|
|
+#define G1_REG_REFER9_BASE G1_SWREG(23)
|
|
+#define G1_REG_REFER10_BASE G1_SWREG(24)
|
|
+#define G1_REG_REFER11_BASE G1_SWREG(25)
|
|
+#define G1_REG_REFER12_BASE G1_SWREG(26)
|
|
+#define G1_REG_REFER13_BASE G1_SWREG(27)
|
|
+#define G1_REG_REFER14_BASE G1_SWREG(28)
|
|
+#define G1_REG_REFER15_BASE G1_SWREG(29)
|
|
+#define G1_REG_QTABLE_BASE G1_SWREG(40)
|
|
+#define G1_REG_DIR_MV_BASE G1_SWREG(41)
|
|
+#define G1_REG_DEC_E(v) ((v) ? BIT(0) : 0)
|
|
+
|
|
+#define G1_REG_DEC_AXI_RD_ID(v) (((v) << 24) & GENMASK(31, 24))
|
|
+#define G1_REG_DEC_TIMEOUT_E(v) ((v) ? BIT(23) : 0)
|
|
+#define G1_REG_DEC_STRSWAP32_E(v) ((v) ? BIT(22) : 0)
|
|
+#define G1_REG_DEC_STRENDIAN_E(v) ((v) ? BIT(21) : 0)
|
|
+#define G1_REG_DEC_INSWAP32_E(v) ((v) ? BIT(20) : 0)
|
|
+#define G1_REG_DEC_OUTSWAP32_E(v) ((v) ? BIT(19) : 0)
|
|
+#define G1_REG_DEC_DATA_DISC_E(v) ((v) ? BIT(18) : 0)
|
|
+#define G1_REG_DEC_LATENCY(v) (((v) << 11) & GENMASK(16, 11))
|
|
+#define G1_REG_DEC_CLK_GATE_E(v) ((v) ? BIT(10) : 0)
|
|
+#define G1_REG_DEC_IN_ENDIAN(v) ((v) ? BIT(9) : 0)
|
|
+#define G1_REG_DEC_OUT_ENDIAN(v) ((v) ? BIT(8) : 0)
|
|
+#define G1_REG_DEC_ADV_PRE_DIS(v) ((v) ? BIT(6) : 0)
|
|
+#define G1_REG_DEC_SCMD_DIS(v) ((v) ? BIT(5) : 0)
|
|
+#define G1_REG_DEC_MAX_BURST(v) (((v) << 0) & GENMASK(4, 0))
|
|
+
|
|
+#define G1_REG_DEC_MODE(v) (((v) << 28) & GENMASK(31, 28))
|
|
+#define G1_REG_RLC_MODE_E(v) ((v) ? BIT(27) : 0)
|
|
+#define G1_REG_PIC_INTERLACE_E(v) ((v) ? BIT(23) : 0)
|
|
+#define G1_REG_PIC_FIELDMODE_E(v) ((v) ? BIT(22) : 0)
|
|
+#define G1_REG_PIC_TOPFIELD_E(v) ((v) ? BIT(19) : 0)
|
|
+#define G1_REG_FILTERING_DIS(v) ((v) ? BIT(14) : 0)
|
|
+#define G1_REG_PIC_FIXED_QUANT(v) ((v) ? BIT(13) : 0)
|
|
+#define G1_REG_WRITE_MVS_E(v) ((v) ? BIT(12) : 0)
|
|
+#define G1_REG_SEQ_MBAFF_E(v) ((v) ? BIT(10) : 0)
|
|
+#define G1_REG_PICORD_COUNT_E(v) ((v) ? BIT(9) : 0)
|
|
+#define G1_REG_DEC_AXI_WR_ID(v) (((v) << 0) & GENMASK(7, 0))
|
|
+
|
|
+#define G1_REG_PIC_MB_WIDTH(v) (((v) << 23) & GENMASK(31, 23))
|
|
+#define G1_REG_PIC_MB_HEIGHT_P(v) (((v) << 11) & GENMASK(18, 11))
|
|
+#define G1_REG_REF_FRAMES(v) (((v) << 0) & GENMASK(4, 0))
|
|
+
|
|
+#define G1_REG_STRM_START_BIT(v) (((v) << 26) & GENMASK(31, 26))
|
|
+#define G1_REG_TYPE1_QUANT_E(v) ((v) ? BIT(24) : 0)
|
|
+#define G1_REG_CH_QP_OFFSET(v) (((v) << 19) & GENMASK(23, 19))
|
|
+#define G1_REG_CH_QP_OFFSET2(v) (((v) << 14) & GENMASK(18, 14))
|
|
+#define G1_REG_FIELDPIC_FLAG_E(v) ((v) ? BIT(0) : 0)
|
|
+
|
|
+#define G1_REG_START_CODE_E(v) ((v) ? BIT(31) : 0)
|
|
+#define G1_REG_INIT_QP(v) (((v) << 25) & GENMASK(30, 25))
|
|
+#define G1_REG_CH_8PIX_ILEAV_E(v) ((v) ? BIT(24) : 0)
|
|
+#define G1_REG_STREAM_LEN(v) (((v) << 0) & GENMASK(23, 0))
|
|
+
|
|
+#define G1_REG_CABAC_E(v) ((v) ? BIT(31) : 0)
|
|
+#define G1_REG_BLACKWHITE_E(v) ((v) ? BIT(30) : 0)
|
|
+#define G1_REG_DIR_8X8_INFER_E(v) ((v) ? BIT(29) : 0)
|
|
+#define G1_REG_WEIGHT_PRED_E(v) ((v) ? BIT(28) : 0)
|
|
+#define G1_REG_WEIGHT_BIPR_IDC(v) (((v) << 26) & GENMASK(27, 26))
|
|
+#define G1_REG_FRAMENUM_LEN(v) (((v) << 16) & GENMASK(20, 16))
|
|
+#define G1_REG_FRAMENUM(v) (((v) << 0) & GENMASK(15, 0))
|
|
+
|
|
+#define G1_REG_CONST_INTRA_E(v) ((v) ? BIT(31) : 0)
|
|
+#define G1_REG_FILT_CTRL_PRES(v) ((v) ? BIT(30) : 0)
|
|
+#define G1_REG_RDPIC_CNT_PRES(v) ((v) ? BIT(29) : 0)
|
|
+#define G1_REG_8X8TRANS_FLAG_E(v) ((v) ? BIT(28) : 0)
|
|
+#define G1_REG_REFPIC_MK_LEN(v) (((v) << 17) & GENMASK(27, 17))
|
|
+#define G1_REG_IDR_PIC_E(v) ((v) ? BIT(16) : 0)
|
|
+#define G1_REG_IDR_PIC_ID(v) (((v) << 0) & GENMASK(15, 0))
|
|
+
|
|
+#define G1_REG_PPS_ID(v) (((v) << 24) & GENMASK(31, 24))
|
|
+#define G1_REG_REFIDX1_ACTIVE(v) (((v) << 19) & GENMASK(23, 19))
|
|
+#define G1_REG_REFIDX0_ACTIVE(v) (((v) << 14) & GENMASK(18, 14))
|
|
+#define G1_REG_POC_LENGTH(v) (((v) << 0) & GENMASK(7, 0))
|
|
+
|
|
+#define G1_REG_PINIT_RLIST_F9(v) (((v) << 25) & GENMASK(29, 25))
|
|
+#define G1_REG_PINIT_RLIST_F8(v) (((v) << 20) & GENMASK(24, 20))
|
|
+#define G1_REG_PINIT_RLIST_F7(v) (((v) << 15) & GENMASK(19, 15))
|
|
+#define G1_REG_PINIT_RLIST_F6(v) (((v) << 10) & GENMASK(14, 10))
|
|
+#define G1_REG_PINIT_RLIST_F5(v) (((v) << 5) & GENMASK(9, 5))
|
|
+#define G1_REG_PINIT_RLIST_F4(v) (((v) << 0) & GENMASK(4, 0))
|
|
+
|
|
+#define G1_REG_PINIT_RLIST_F15(v) (((v) << 25) & GENMASK(29, 25))
|
|
+#define G1_REG_PINIT_RLIST_F14(v) (((v) << 20) & GENMASK(24, 20))
|
|
+#define G1_REG_PINIT_RLIST_F13(v) (((v) << 15) & GENMASK(19, 15))
|
|
+#define G1_REG_PINIT_RLIST_F12(v) (((v) << 10) & GENMASK(14, 10))
|
|
+#define G1_REG_PINIT_RLIST_F11(v) (((v) << 5) & GENMASK(9, 5))
|
|
+#define G1_REG_PINIT_RLIST_F10(v) (((v) << 0) & GENMASK(4, 0))
|
|
+
|
|
+#define G1_REG_REFER1_NBR(v) (((v) << 16) & GENMASK(31, 16))
|
|
+#define G1_REG_REFER0_NBR(v) (((v) << 0) & GENMASK(15, 0))
|
|
+
|
|
+#define G1_REG_REFER3_NBR(v) (((v) << 16) & GENMASK(31, 16))
|
|
+#define G1_REG_REFER2_NBR(v) (((v) << 0) & GENMASK(15, 0))
|
|
+
|
|
+#define G1_REG_REFER5_NBR(v) (((v) << 16) & GENMASK(31, 16))
|
|
+#define G1_REG_REFER4_NBR(v) (((v) << 0) & GENMASK(15, 0))
|
|
+
|
|
+#define G1_REG_REFER7_NBR(v) (((v) << 16) & GENMASK(31, 16))
|
|
+#define G1_REG_REFER6_NBR(v) (((v) << 0) & GENMASK(15, 0))
|
|
+
|
|
+#define G1_REG_REFER9_NBR(v) (((v) << 16) & GENMASK(31, 16))
|
|
+#define G1_REG_REFER8_NBR(v) (((v) << 0) & GENMASK(15, 0))
|
|
+
|
|
+#define G1_REG_REFER11_NBR(v) (((v) << 16) & GENMASK(31, 16))
|
|
+#define G1_REG_REFER10_NBR(v) (((v) << 0) & GENMASK(15, 0))
|
|
+
|
|
+#define G1_REG_REFER13_NBR(v) (((v) << 16) & GENMASK(31, 16))
|
|
+#define G1_REG_REFER12_NBR(v) (((v) << 0) & GENMASK(15, 0))
|
|
+
|
|
+#define G1_REG_REFER15_NBR(v) (((v) << 16) & GENMASK(31, 16))
|
|
+#define G1_REG_REFER14_NBR(v) (((v) << 0) & GENMASK(15, 0))
|
|
+
|
|
+#define G1_REG_REFER_LTERM_E(v) (((v) << 0) & GENMASK(31, 0))
|
|
+
|
|
+#define G1_REG_REFER_VALID_E(v) (((v) << 0) & GENMASK(31, 0))
|
|
+
|
|
+#define G1_REG_BINIT_RLIST_B2(v) (((v) << 25) & GENMASK(29, 25))
|
|
+#define G1_REG_BINIT_RLIST_F2(v) (((v) << 20) & GENMASK(24, 20))
|
|
+#define G1_REG_BINIT_RLIST_B1(v) (((v) << 15) & GENMASK(19, 15))
|
|
+#define G1_REG_BINIT_RLIST_F1(v) (((v) << 10) & GENMASK(14, 10))
|
|
+#define G1_REG_BINIT_RLIST_B0(v) (((v) << 5) & GENMASK(9, 5))
|
|
+#define G1_REG_BINIT_RLIST_F0(v) (((v) << 0) & GENMASK(4, 0))
|
|
+
|
|
+#define G1_REG_BINIT_RLIST_B5(v) (((v) << 25) & GENMASK(29, 25))
|
|
+#define G1_REG_BINIT_RLIST_F5(v) (((v) << 20) & GENMASK(24, 20))
|
|
+#define G1_REG_BINIT_RLIST_B4(v) (((v) << 15) & GENMASK(19, 15))
|
|
+#define G1_REG_BINIT_RLIST_F4(v) (((v) << 10) & GENMASK(14, 10))
|
|
+#define G1_REG_BINIT_RLIST_B3(v) (((v) << 5) & GENMASK(9, 5))
|
|
+#define G1_REG_BINIT_RLIST_F3(v) (((v) << 0) & GENMASK(4, 0))
|
|
+
|
|
+#define G1_REG_BINIT_RLIST_B8(v) (((v) << 25) & GENMASK(29, 25))
|
|
+#define G1_REG_BINIT_RLIST_F8(v) (((v) << 20) & GENMASK(24, 20))
|
|
+#define G1_REG_BINIT_RLIST_B7(v) (((v) << 15) & GENMASK(19, 15))
|
|
+#define G1_REG_BINIT_RLIST_F7(v) (((v) << 10) & GENMASK(14, 10))
|
|
+#define G1_REG_BINIT_RLIST_B6(v) (((v) << 5) & GENMASK(9, 5))
|
|
+#define G1_REG_BINIT_RLIST_F6(v) (((v) << 0) & GENMASK(4, 0))
|
|
+
|
|
+#define G1_REG_BINIT_RLIST_B11(v) (((v) << 25) & GENMASK(29, 25))
|
|
+#define G1_REG_BINIT_RLIST_F11(v) (((v) << 20) & GENMASK(24, 20))
|
|
+#define G1_REG_BINIT_RLIST_B10(v) (((v) << 15) & GENMASK(19, 15))
|
|
+#define G1_REG_BINIT_RLIST_F10(v) (((v) << 10) & GENMASK(14, 10))
|
|
+#define G1_REG_BINIT_RLIST_B9(v) (((v) << 5) & GENMASK(9, 5))
|
|
+#define G1_REG_BINIT_RLIST_F9(v) (((v) << 0) & GENMASK(4, 0))
|
|
+
|
|
+#define G1_REG_BINIT_RLIST_B14(v) (((v) << 25) & GENMASK(29, 25))
|
|
+#define G1_REG_BINIT_RLIST_F14(v) (((v) << 20) & GENMASK(24, 20))
|
|
+#define G1_REG_BINIT_RLIST_B13(v) (((v) << 15) & GENMASK(19, 15))
|
|
+#define G1_REG_BINIT_RLIST_F13(v) (((v) << 10) & GENMASK(14, 10))
|
|
+#define G1_REG_BINIT_RLIST_B12(v) (((v) << 5) & GENMASK(9, 5))
|
|
+#define G1_REG_BINIT_RLIST_F12(v) (((v) << 0) & GENMASK(4, 0))
|
|
+
|
|
+#define G1_REG_PINIT_RLIST_F3(v) (((v) << 25) & GENMASK(29, 25))
|
|
+#define G1_REG_PINIT_RLIST_F2(v) (((v) << 20) & GENMASK(24, 20))
|
|
+#define G1_REG_PINIT_RLIST_F1(v) (((v) << 15) & GENMASK(19, 15))
|
|
+#define G1_REG_PINIT_RLIST_F0(v) (((v) << 10) & GENMASK(14, 10))
|
|
+#define G1_REG_BINIT_RLIST_B15(v) (((v) << 5) & GENMASK(9, 5))
|
|
+#define G1_REG_BINIT_RLIST_F15(v) (((v) << 0) & GENMASK(4, 0))
|
|
+
|
|
+#define G1_REG_STARTMB_X(v) (((v) << 23) & GENMASK(31, 23))
|
|
+#define G1_REG_STARTMB_Y(v) (((v) << 15) & GENMASK(22, 15))
|
|
+
|
|
+#define G1_REG_PRED_BC_TAP_0_0(v) (((v) << 22) & GENMASK(31, 22))
|
|
+#define G1_REG_PRED_BC_TAP_0_1(v) (((v) << 12) & GENMASK(21, 12))
|
|
+#define G1_REG_PRED_BC_TAP_0_2(v) (((v) << 2) & GENMASK(11, 2))
|
|
+
|
|
+#define G1_REG_REFBU_E(v) ((v) ? BIT(31) : 0)
|
|
+
|
|
+#define G1_REG_APF_THRESHOLD(v) (((v) << 0) & GENMASK(13, 0))
|
|
+
|
|
+void hantro_g1_h264_dec_run(struct hantro_ctx *ctx)
|
|
{
|
|
- const struct hantro_h264_dec_ctrls *ctrls = &ctx->h264_dec.ctrls;
|
|
- const struct v4l2_ctrl_h264_decode_params *dec_param = ctrls->decode;
|
|
- const struct v4l2_ctrl_h264_slice_params *slices = ctrls->slices;
|
|
- const struct v4l2_ctrl_h264_sps *sps = ctrls->sps;
|
|
- const struct v4l2_ctrl_h264_pps *pps = ctrls->pps;
|
|
- struct vb2_v4l2_buffer *src_buf = hantro_get_src_buf(ctx);
|
|
struct hantro_dev *vpu = ctx->dev;
|
|
+ struct vb2_v4l2_buffer *src_buf, *dst_buf;
|
|
+ const struct hantro_h264_dec_ctrls *ctrls;
|
|
+ const struct v4l2_ctrl_h264_decode_params *decode;
|
|
+ const struct v4l2_ctrl_h264_slice_params *slices;
|
|
+ const struct v4l2_ctrl_h264_sps *sps;
|
|
+ const struct v4l2_ctrl_h264_pps *pps;
|
|
+ const u8 *b0_reflist, *b1_reflist, *p_reflist;
|
|
+ dma_addr_t addr;
|
|
+ size_t offset = 0;
|
|
u32 reg;
|
|
|
|
- /* Decoder control register 0. */
|
|
- reg = G1_REG_DEC_CTRL0_DEC_AXI_WR_ID(0x0);
|
|
- if (sps->flags & V4L2_H264_SPS_FLAG_MB_ADAPTIVE_FRAME_FIELD)
|
|
- reg |= G1_REG_DEC_CTRL0_SEQ_MBAFF_E;
|
|
- if (sps->profile_idc > 66) {
|
|
- reg |= G1_REG_DEC_CTRL0_PICORD_COUNT_E;
|
|
- if (dec_param->nal_ref_idc)
|
|
- reg |= G1_REG_DEC_CTRL0_WRITE_MVS_E;
|
|
- }
|
|
+ /* Prepare the H264 decoder context. */
|
|
+ if (hantro_h264_dec_prepare_run(ctx))
|
|
+ return;
|
|
|
|
- if (!(sps->flags & V4L2_H264_SPS_FLAG_FRAME_MBS_ONLY) &&
|
|
- (sps->flags & V4L2_H264_SPS_FLAG_MB_ADAPTIVE_FRAME_FIELD ||
|
|
- slices[0].flags & V4L2_H264_SLICE_FLAG_FIELD_PIC))
|
|
- reg |= G1_REG_DEC_CTRL0_PIC_INTERLACE_E;
|
|
- if (slices[0].flags & V4L2_H264_SLICE_FLAG_FIELD_PIC)
|
|
- reg |= G1_REG_DEC_CTRL0_PIC_FIELDMODE_E;
|
|
- if (!(slices[0].flags & V4L2_H264_SLICE_FLAG_BOTTOM_FIELD))
|
|
- reg |= G1_REG_DEC_CTRL0_PIC_TOPFIELD_E;
|
|
- vdpu_write_relaxed(vpu, reg, G1_REG_DEC_CTRL0);
|
|
-
|
|
- /* Decoder control register 1. */
|
|
- reg = G1_REG_DEC_CTRL1_PIC_MB_WIDTH(MB_WIDTH(ctx->src_fmt.width)) |
|
|
- G1_REG_DEC_CTRL1_PIC_MB_HEIGHT_P(MB_HEIGHT(ctx->src_fmt.height)) |
|
|
- G1_REG_DEC_CTRL1_REF_FRAMES(sps->max_num_ref_frames);
|
|
- vdpu_write_relaxed(vpu, reg, G1_REG_DEC_CTRL1);
|
|
-
|
|
- /* Decoder control register 2. */
|
|
- reg = G1_REG_DEC_CTRL2_CH_QP_OFFSET(pps->chroma_qp_index_offset) |
|
|
- G1_REG_DEC_CTRL2_CH_QP_OFFSET2(pps->second_chroma_qp_index_offset);
|
|
-
|
|
- /* always use the matrix sent from userspace */
|
|
- reg |= G1_REG_DEC_CTRL2_TYPE1_QUANT_E;
|
|
-
|
|
- if (!(sps->flags & V4L2_H264_SPS_FLAG_FRAME_MBS_ONLY))
|
|
- reg |= G1_REG_DEC_CTRL2_FIELDPIC_FLAG_E;
|
|
- vdpu_write_relaxed(vpu, reg, G1_REG_DEC_CTRL2);
|
|
-
|
|
- /* Decoder control register 3. */
|
|
- reg = G1_REG_DEC_CTRL3_START_CODE_E |
|
|
- G1_REG_DEC_CTRL3_INIT_QP(pps->pic_init_qp_minus26 + 26) |
|
|
- G1_REG_DEC_CTRL3_STREAM_LEN(vb2_get_plane_payload(&src_buf->vb2_buf, 0));
|
|
- vdpu_write_relaxed(vpu, reg, G1_REG_DEC_CTRL3);
|
|
-
|
|
- /* Decoder control register 4. */
|
|
- reg = G1_REG_DEC_CTRL4_FRAMENUM_LEN(sps->log2_max_frame_num_minus4 + 4) |
|
|
- G1_REG_DEC_CTRL4_FRAMENUM(slices[0].frame_num) |
|
|
- G1_REG_DEC_CTRL4_WEIGHT_BIPR_IDC(pps->weighted_bipred_idc);
|
|
- if (pps->flags & V4L2_H264_PPS_FLAG_ENTROPY_CODING_MODE)
|
|
- reg |= G1_REG_DEC_CTRL4_CABAC_E;
|
|
- if (sps->flags & V4L2_H264_SPS_FLAG_DIRECT_8X8_INFERENCE)
|
|
- reg |= G1_REG_DEC_CTRL4_DIR_8X8_INFER_E;
|
|
- if (sps->profile_idc >= 100 && sps->chroma_format_idc == 0)
|
|
- reg |= G1_REG_DEC_CTRL4_BLACKWHITE_E;
|
|
- if (pps->flags & V4L2_H264_PPS_FLAG_WEIGHTED_PRED)
|
|
- reg |= G1_REG_DEC_CTRL4_WEIGHT_PRED_E;
|
|
- vdpu_write_relaxed(vpu, reg, G1_REG_DEC_CTRL4);
|
|
-
|
|
- /* Decoder control register 5. */
|
|
- reg = G1_REG_DEC_CTRL5_REFPIC_MK_LEN(slices[0].dec_ref_pic_marking_bit_size) |
|
|
- G1_REG_DEC_CTRL5_IDR_PIC_ID(slices[0].idr_pic_id);
|
|
- if (pps->flags & V4L2_H264_PPS_FLAG_CONSTRAINED_INTRA_PRED)
|
|
- reg |= G1_REG_DEC_CTRL5_CONST_INTRA_E;
|
|
- if (pps->flags & V4L2_H264_PPS_FLAG_DEBLOCKING_FILTER_CONTROL_PRESENT)
|
|
- reg |= G1_REG_DEC_CTRL5_FILT_CTRL_PRES;
|
|
- if (pps->flags & V4L2_H264_PPS_FLAG_REDUNDANT_PIC_CNT_PRESENT)
|
|
- reg |= G1_REG_DEC_CTRL5_RDPIC_CNT_PRES;
|
|
- if (pps->flags & V4L2_H264_PPS_FLAG_TRANSFORM_8X8_MODE)
|
|
- reg |= G1_REG_DEC_CTRL5_8X8TRANS_FLAG_E;
|
|
- if (dec_param->flags & V4L2_H264_DECODE_PARAM_FLAG_IDR_PIC)
|
|
- reg |= G1_REG_DEC_CTRL5_IDR_PIC_E;
|
|
- vdpu_write_relaxed(vpu, reg, G1_REG_DEC_CTRL5);
|
|
-
|
|
- /* Decoder control register 6. */
|
|
- reg = G1_REG_DEC_CTRL6_PPS_ID(slices[0].pic_parameter_set_id) |
|
|
- G1_REG_DEC_CTRL6_REFIDX0_ACTIVE(pps->num_ref_idx_l0_default_active_minus1 + 1) |
|
|
- G1_REG_DEC_CTRL6_REFIDX1_ACTIVE(pps->num_ref_idx_l1_default_active_minus1 + 1) |
|
|
- G1_REG_DEC_CTRL6_POC_LENGTH(slices[0].pic_order_cnt_bit_size);
|
|
- vdpu_write_relaxed(vpu, reg, G1_REG_DEC_CTRL6);
|
|
-
|
|
- /* Error concealment register. */
|
|
- vdpu_write_relaxed(vpu, 0, G1_REG_ERR_CONC);
|
|
-
|
|
- /* Prediction filter tap register. */
|
|
- vdpu_write_relaxed(vpu,
|
|
- G1_REG_PRED_FLT_PRED_BC_TAP_0_0(1) |
|
|
- G1_REG_PRED_FLT_PRED_BC_TAP_0_1(-5 & 0x3ff) |
|
|
- G1_REG_PRED_FLT_PRED_BC_TAP_0_2(20),
|
|
- G1_REG_PRED_FLT);
|
|
-
|
|
- /* Reference picture buffer control register. */
|
|
- vdpu_write_relaxed(vpu, 0, G1_REG_REF_BUF_CTRL);
|
|
-
|
|
- /* Reference picture buffer control register 2. */
|
|
- vdpu_write_relaxed(vpu, G1_REG_REF_BUF_CTRL2_APF_THRESHOLD(8),
|
|
- G1_REG_REF_BUF_CTRL2);
|
|
-}
|
|
+ src_buf = hantro_get_src_buf(ctx);
|
|
+ dst_buf = hantro_get_dst_buf(ctx);
|
|
|
|
-static void set_ref(struct hantro_ctx *ctx)
|
|
-{
|
|
- struct v4l2_h264_dpb_entry *dpb = ctx->h264_dec.dpb;
|
|
- const u8 *b0_reflist, *b1_reflist, *p_reflist;
|
|
- struct hantro_dev *vpu = ctx->dev;
|
|
- int reg_num;
|
|
- u32 reg;
|
|
- int i;
|
|
-
|
|
- vdpu_write_relaxed(vpu, ctx->h264_dec.dpb_valid, G1_REG_VALID_REF);
|
|
- vdpu_write_relaxed(vpu, ctx->h264_dec.dpb_longterm, G1_REG_LT_REF);
|
|
-
|
|
- /*
|
|
- * Set up reference frame picture numbers.
|
|
- *
|
|
- * Each G1_REG_REF_PIC(x) register contains numbers of two
|
|
- * subsequential reference pictures.
|
|
- */
|
|
- for (i = 0; i < HANTRO_H264_DPB_SIZE; i += 2) {
|
|
- reg = 0;
|
|
- if (dpb[i].flags & V4L2_H264_DPB_ENTRY_FLAG_LONG_TERM)
|
|
- reg |= G1_REG_REF_PIC_REFER0_NBR(dpb[i].pic_num);
|
|
- else
|
|
- reg |= G1_REG_REF_PIC_REFER0_NBR(dpb[i].frame_num);
|
|
-
|
|
- if (dpb[i + 1].flags & V4L2_H264_DPB_ENTRY_FLAG_LONG_TERM)
|
|
- reg |= G1_REG_REF_PIC_REFER1_NBR(dpb[i + 1].pic_num);
|
|
- else
|
|
- reg |= G1_REG_REF_PIC_REFER1_NBR(dpb[i + 1].frame_num);
|
|
-
|
|
- vdpu_write_relaxed(vpu, reg, G1_REG_REF_PIC(i / 2));
|
|
- }
|
|
+ ctrls = &ctx->h264_dec.ctrls;
|
|
+ decode = ctrls->decode;
|
|
+ slices = ctrls->slices;
|
|
+ sps = ctrls->sps;
|
|
+ pps = ctrls->pps;
|
|
|
|
b0_reflist = ctx->h264_dec.reflists.b0;
|
|
b1_reflist = ctx->h264_dec.reflists.b1;
|
|
p_reflist = ctx->h264_dec.reflists.p;
|
|
|
|
- /*
|
|
- * Each G1_REG_BD_REF_PIC(x) register contains three entries
|
|
- * of each forward and backward picture list.
|
|
- */
|
|
- reg_num = 0;
|
|
- for (i = 0; i < 15; i += 3) {
|
|
- reg = G1_REG_BD_REF_PIC_BINIT_RLIST_F0(b0_reflist[i]) |
|
|
- G1_REG_BD_REF_PIC_BINIT_RLIST_F1(b0_reflist[i + 1]) |
|
|
- G1_REG_BD_REF_PIC_BINIT_RLIST_F2(b0_reflist[i + 2]) |
|
|
- G1_REG_BD_REF_PIC_BINIT_RLIST_B0(b1_reflist[i]) |
|
|
- G1_REG_BD_REF_PIC_BINIT_RLIST_B1(b1_reflist[i + 1]) |
|
|
- G1_REG_BD_REF_PIC_BINIT_RLIST_B2(b1_reflist[i + 2]);
|
|
- vdpu_write_relaxed(vpu, reg, G1_REG_BD_REF_PIC(reg_num++));
|
|
- }
|
|
-
|
|
- /*
|
|
- * G1_REG_BD_P_REF_PIC register contains last entries (index 15)
|
|
- * of forward and backward reference picture lists and first 4 entries
|
|
- * of P forward picture list.
|
|
- */
|
|
- reg = G1_REG_BD_P_REF_PIC_BINIT_RLIST_F15(b0_reflist[15]) |
|
|
- G1_REG_BD_P_REF_PIC_BINIT_RLIST_B15(b1_reflist[15]) |
|
|
- G1_REG_BD_P_REF_PIC_PINIT_RLIST_F0(p_reflist[0]) |
|
|
- G1_REG_BD_P_REF_PIC_PINIT_RLIST_F1(p_reflist[1]) |
|
|
- G1_REG_BD_P_REF_PIC_PINIT_RLIST_F2(p_reflist[2]) |
|
|
- G1_REG_BD_P_REF_PIC_PINIT_RLIST_F3(p_reflist[3]);
|
|
- vdpu_write_relaxed(vpu, reg, G1_REG_BD_P_REF_PIC);
|
|
-
|
|
- /*
|
|
- * Each G1_REG_FWD_PIC(x) register contains six consecutive
|
|
- * entries of P forward picture list, starting from index 4.
|
|
- */
|
|
- reg_num = 0;
|
|
- for (i = 4; i < HANTRO_H264_DPB_SIZE; i += 6) {
|
|
- reg = G1_REG_FWD_PIC_PINIT_RLIST_F0(p_reflist[i]) |
|
|
- G1_REG_FWD_PIC_PINIT_RLIST_F1(p_reflist[i + 1]) |
|
|
- G1_REG_FWD_PIC_PINIT_RLIST_F2(p_reflist[i + 2]) |
|
|
- G1_REG_FWD_PIC_PINIT_RLIST_F3(p_reflist[i + 3]) |
|
|
- G1_REG_FWD_PIC_PINIT_RLIST_F4(p_reflist[i + 4]) |
|
|
- G1_REG_FWD_PIC_PINIT_RLIST_F5(p_reflist[i + 5]);
|
|
- vdpu_write_relaxed(vpu, reg, G1_REG_FWD_PIC(reg_num++));
|
|
- }
|
|
+ reg = G1_REG_DEC_AXI_RD_ID(0xff) |
|
|
+ G1_REG_DEC_TIMEOUT_E(1) |
|
|
+ G1_REG_DEC_STRSWAP32_E(1) |
|
|
+ G1_REG_DEC_STRENDIAN_E(1) |
|
|
+ G1_REG_DEC_INSWAP32_E(1) |
|
|
+ G1_REG_DEC_OUTSWAP32_E(1) |
|
|
+ G1_REG_DEC_DATA_DISC_E(0) |
|
|
+ G1_REG_DEC_LATENCY(0) |
|
|
+ G1_REG_DEC_CLK_GATE_E(1) |
|
|
+ G1_REG_DEC_IN_ENDIAN(0) |
|
|
+ G1_REG_DEC_OUT_ENDIAN(1) |
|
|
+ G1_REG_DEC_ADV_PRE_DIS(0) |
|
|
+ G1_REG_DEC_SCMD_DIS(0) |
|
|
+ G1_REG_DEC_MAX_BURST(16);
|
|
+ vdpu_write_relaxed(vpu, reg, G1_SWREG(2));
|
|
+
|
|
+ reg = G1_REG_DEC_MODE(0) |
|
|
+ G1_REG_RLC_MODE_E(0) |
|
|
+ G1_REG_PIC_INTERLACE_E(!(sps->flags & V4L2_H264_SPS_FLAG_FRAME_MBS_ONLY) && (sps->flags & V4L2_H264_SPS_FLAG_MB_ADAPTIVE_FRAME_FIELD || slices[0].flags & V4L2_H264_SLICE_FLAG_FIELD_PIC)) |
|
|
+ G1_REG_PIC_FIELDMODE_E(slices[0].flags & V4L2_H264_SLICE_FLAG_FIELD_PIC) |
|
|
+ G1_REG_PIC_TOPFIELD_E(!(slices[0].flags & V4L2_H264_SLICE_FLAG_BOTTOM_FIELD)) |
|
|
+ G1_REG_FILTERING_DIS(0) |
|
|
+ G1_REG_PIC_FIXED_QUANT(0) |
|
|
+ G1_REG_WRITE_MVS_E(sps->profile_idc > 66 && decode->nal_ref_idc) |
|
|
+ G1_REG_SEQ_MBAFF_E(sps->flags & V4L2_H264_SPS_FLAG_MB_ADAPTIVE_FRAME_FIELD) |
|
|
+ G1_REG_PICORD_COUNT_E(sps->profile_idc > 66) |
|
|
+ G1_REG_DEC_AXI_WR_ID(0);
|
|
+ vdpu_write_relaxed(vpu, reg, G1_SWREG(3));
|
|
+
|
|
+ reg = G1_REG_PIC_MB_WIDTH(MB_WIDTH(ctx->src_fmt.width)) |
|
|
+ G1_REG_PIC_MB_HEIGHT_P(MB_HEIGHT(ctx->src_fmt.height)) |
|
|
+ G1_REG_REF_FRAMES(sps->max_num_ref_frames);
|
|
+ vdpu_write_relaxed(vpu, reg, G1_SWREG(4));
|
|
+
|
|
+ reg = G1_REG_STRM_START_BIT(0) |
|
|
+ G1_REG_TYPE1_QUANT_E(1) |
|
|
+ G1_REG_CH_QP_OFFSET(pps->chroma_qp_index_offset) |
|
|
+ G1_REG_CH_QP_OFFSET2(pps->second_chroma_qp_index_offset) |
|
|
+ G1_REG_FIELDPIC_FLAG_E(!(sps->flags & V4L2_H264_SPS_FLAG_FRAME_MBS_ONLY));
|
|
+ vdpu_write_relaxed(vpu, reg, G1_SWREG(5));
|
|
+
|
|
+ reg = G1_REG_START_CODE_E(1) |
|
|
+ G1_REG_INIT_QP(pps->pic_init_qp_minus26 + 26) |
|
|
+ G1_REG_CH_8PIX_ILEAV_E(0) |
|
|
+ G1_REG_STREAM_LEN(vb2_get_plane_payload(&src_buf->vb2_buf, 0));
|
|
+ vdpu_write_relaxed(vpu, reg, G1_SWREG(6));
|
|
+
|
|
+ reg = G1_REG_CABAC_E(pps->flags & V4L2_H264_PPS_FLAG_ENTROPY_CODING_MODE) |
|
|
+ G1_REG_BLACKWHITE_E(sps->profile_idc >= 100 && sps->chroma_format_idc == 0) |
|
|
+ G1_REG_DIR_8X8_INFER_E(sps->flags & V4L2_H264_SPS_FLAG_DIRECT_8X8_INFERENCE) |
|
|
+ G1_REG_WEIGHT_PRED_E(pps->flags & V4L2_H264_PPS_FLAG_WEIGHTED_PRED) |
|
|
+ G1_REG_WEIGHT_BIPR_IDC(pps->weighted_bipred_idc) |
|
|
+ G1_REG_FRAMENUM_LEN(sps->log2_max_frame_num_minus4 + 4) |
|
|
+ G1_REG_FRAMENUM(slices[0].frame_num);
|
|
+ vdpu_write_relaxed(vpu, reg, G1_SWREG(7));
|
|
+
|
|
+ reg = G1_REG_CONST_INTRA_E(pps->flags & V4L2_H264_PPS_FLAG_CONSTRAINED_INTRA_PRED) |
|
|
+ G1_REG_FILT_CTRL_PRES(pps->flags & V4L2_H264_PPS_FLAG_DEBLOCKING_FILTER_CONTROL_PRESENT) |
|
|
+ G1_REG_RDPIC_CNT_PRES(pps->flags & V4L2_H264_PPS_FLAG_REDUNDANT_PIC_CNT_PRESENT) |
|
|
+ G1_REG_8X8TRANS_FLAG_E(pps->flags & V4L2_H264_PPS_FLAG_TRANSFORM_8X8_MODE) |
|
|
+ G1_REG_REFPIC_MK_LEN(slices[0].dec_ref_pic_marking_bit_size) |
|
|
+ G1_REG_IDR_PIC_E(decode->flags & V4L2_H264_DECODE_PARAM_FLAG_IDR_PIC) |
|
|
+ G1_REG_IDR_PIC_ID(slices[0].idr_pic_id);
|
|
+ vdpu_write_relaxed(vpu, reg, G1_SWREG(8));
|
|
+
|
|
+ reg = G1_REG_PPS_ID(slices[0].pic_parameter_set_id) |
|
|
+ G1_REG_REFIDX1_ACTIVE(pps->num_ref_idx_l1_default_active_minus1 + 1) |
|
|
+ G1_REG_REFIDX0_ACTIVE(pps->num_ref_idx_l0_default_active_minus1 + 1) |
|
|
+ G1_REG_POC_LENGTH(slices[0].pic_order_cnt_bit_size);
|
|
+ vdpu_write_relaxed(vpu, reg, G1_SWREG(9));
|
|
+
|
|
+ reg = G1_REG_PINIT_RLIST_F9(p_reflist[9]) |
|
|
+ G1_REG_PINIT_RLIST_F8(p_reflist[8]) |
|
|
+ G1_REG_PINIT_RLIST_F7(p_reflist[7]) |
|
|
+ G1_REG_PINIT_RLIST_F6(p_reflist[6]) |
|
|
+ G1_REG_PINIT_RLIST_F5(p_reflist[5]) |
|
|
+ G1_REG_PINIT_RLIST_F4(p_reflist[4]);
|
|
+ vdpu_write_relaxed(vpu, reg, G1_SWREG(10));
|
|
+
|
|
+ reg = G1_REG_PINIT_RLIST_F15(p_reflist[15]) |
|
|
+ G1_REG_PINIT_RLIST_F14(p_reflist[14]) |
|
|
+ G1_REG_PINIT_RLIST_F13(p_reflist[13]) |
|
|
+ G1_REG_PINIT_RLIST_F12(p_reflist[12]) |
|
|
+ G1_REG_PINIT_RLIST_F11(p_reflist[11]) |
|
|
+ G1_REG_PINIT_RLIST_F10(p_reflist[10]);
|
|
+ vdpu_write_relaxed(vpu, reg, G1_SWREG(11));
|
|
+
|
|
+ reg = G1_REG_REFER1_NBR(hantro_h264_get_ref_nbr(ctx, 1)) |
|
|
+ G1_REG_REFER0_NBR(hantro_h264_get_ref_nbr(ctx, 0));
|
|
+ vdpu_write_relaxed(vpu, reg, G1_SWREG(30));
|
|
+
|
|
+ reg = G1_REG_REFER3_NBR(hantro_h264_get_ref_nbr(ctx, 3)) |
|
|
+ G1_REG_REFER2_NBR(hantro_h264_get_ref_nbr(ctx, 2));
|
|
+ vdpu_write_relaxed(vpu, reg, G1_SWREG(31));
|
|
+
|
|
+ reg = G1_REG_REFER5_NBR(hantro_h264_get_ref_nbr(ctx, 5)) |
|
|
+ G1_REG_REFER4_NBR(hantro_h264_get_ref_nbr(ctx, 4));
|
|
+ vdpu_write_relaxed(vpu, reg, G1_SWREG(32));
|
|
+
|
|
+ reg = G1_REG_REFER7_NBR(hantro_h264_get_ref_nbr(ctx, 7)) |
|
|
+ G1_REG_REFER6_NBR(hantro_h264_get_ref_nbr(ctx, 6));
|
|
+ vdpu_write_relaxed(vpu, reg, G1_SWREG(33));
|
|
+
|
|
+ reg = G1_REG_REFER9_NBR(hantro_h264_get_ref_nbr(ctx, 9)) |
|
|
+ G1_REG_REFER8_NBR(hantro_h264_get_ref_nbr(ctx, 8));
|
|
+ vdpu_write_relaxed(vpu, reg, G1_SWREG(34));
|
|
+
|
|
+ reg = G1_REG_REFER11_NBR(hantro_h264_get_ref_nbr(ctx, 11)) |
|
|
+ G1_REG_REFER10_NBR(hantro_h264_get_ref_nbr(ctx, 10));
|
|
+ vdpu_write_relaxed(vpu, reg, G1_SWREG(35));
|
|
+
|
|
+ reg = G1_REG_REFER13_NBR(hantro_h264_get_ref_nbr(ctx, 13)) |
|
|
+ G1_REG_REFER12_NBR(hantro_h264_get_ref_nbr(ctx, 12));
|
|
+ vdpu_write_relaxed(vpu, reg, G1_SWREG(36));
|
|
+
|
|
+ reg = G1_REG_REFER15_NBR(hantro_h264_get_ref_nbr(ctx, 15)) |
|
|
+ G1_REG_REFER14_NBR(hantro_h264_get_ref_nbr(ctx, 14));
|
|
+ vdpu_write_relaxed(vpu, reg, G1_SWREG(37));
|
|
+
|
|
+ reg = G1_REG_REFER_LTERM_E(ctx->h264_dec.dpb_longterm);
|
|
+ vdpu_write_relaxed(vpu, reg, G1_SWREG(38));
|
|
+
|
|
+ reg = G1_REG_REFER_VALID_E(ctx->h264_dec.dpb_valid);
|
|
+ vdpu_write_relaxed(vpu, reg, G1_SWREG(39));
|
|
+
|
|
+ reg = G1_REG_BINIT_RLIST_B2(b1_reflist[2]) |
|
|
+ G1_REG_BINIT_RLIST_F2(b0_reflist[2]) |
|
|
+ G1_REG_BINIT_RLIST_B1(b1_reflist[1]) |
|
|
+ G1_REG_BINIT_RLIST_F1(b0_reflist[1]) |
|
|
+ G1_REG_BINIT_RLIST_B0(b1_reflist[0]) |
|
|
+ G1_REG_BINIT_RLIST_F0(b0_reflist[0]);
|
|
+ vdpu_write_relaxed(vpu, reg, G1_SWREG(42));
|
|
+
|
|
+ reg = G1_REG_BINIT_RLIST_B5(b1_reflist[5]) |
|
|
+ G1_REG_BINIT_RLIST_F5(b0_reflist[5]) |
|
|
+ G1_REG_BINIT_RLIST_B4(b1_reflist[4]) |
|
|
+ G1_REG_BINIT_RLIST_F4(b0_reflist[4]) |
|
|
+ G1_REG_BINIT_RLIST_B3(b1_reflist[3]) |
|
|
+ G1_REG_BINIT_RLIST_F3(b0_reflist[3]);
|
|
+ vdpu_write_relaxed(vpu, reg, G1_SWREG(43));
|
|
+
|
|
+ reg = G1_REG_BINIT_RLIST_B8(b1_reflist[8]) |
|
|
+ G1_REG_BINIT_RLIST_F8(b0_reflist[8]) |
|
|
+ G1_REG_BINIT_RLIST_B7(b1_reflist[7]) |
|
|
+ G1_REG_BINIT_RLIST_F7(b0_reflist[7]) |
|
|
+ G1_REG_BINIT_RLIST_B6(b1_reflist[6]) |
|
|
+ G1_REG_BINIT_RLIST_F6(b0_reflist[6]);
|
|
+ vdpu_write_relaxed(vpu, reg, G1_SWREG(44));
|
|
+
|
|
+ reg = G1_REG_BINIT_RLIST_B11(b1_reflist[11]) |
|
|
+ G1_REG_BINIT_RLIST_F11(b0_reflist[11]) |
|
|
+ G1_REG_BINIT_RLIST_B10(b1_reflist[10]) |
|
|
+ G1_REG_BINIT_RLIST_F10(b0_reflist[10]) |
|
|
+ G1_REG_BINIT_RLIST_B9(b1_reflist[9]) |
|
|
+ G1_REG_BINIT_RLIST_F9(b0_reflist[9]);
|
|
+ vdpu_write_relaxed(vpu, reg, G1_SWREG(45));
|
|
+
|
|
+ reg = G1_REG_BINIT_RLIST_B14(b1_reflist[14]) |
|
|
+ G1_REG_BINIT_RLIST_F14(b0_reflist[14]) |
|
|
+ G1_REG_BINIT_RLIST_B13(b1_reflist[13]) |
|
|
+ G1_REG_BINIT_RLIST_F13(b0_reflist[13]) |
|
|
+ G1_REG_BINIT_RLIST_B12(b1_reflist[12]) |
|
|
+ G1_REG_BINIT_RLIST_F12(b0_reflist[12]);
|
|
+ vdpu_write_relaxed(vpu, reg, G1_SWREG(46));
|
|
+
|
|
+ reg = G1_REG_PINIT_RLIST_F3(p_reflist[3]) |
|
|
+ G1_REG_PINIT_RLIST_F2(p_reflist[2]) |
|
|
+ G1_REG_PINIT_RLIST_F1(p_reflist[1]) |
|
|
+ G1_REG_PINIT_RLIST_F0(p_reflist[0]) |
|
|
+ G1_REG_BINIT_RLIST_B15(b1_reflist[15]) |
|
|
+ G1_REG_BINIT_RLIST_F15(b0_reflist[15]);
|
|
+ vdpu_write_relaxed(vpu, reg, G1_SWREG(47));
|
|
+
|
|
+ reg = G1_REG_STARTMB_X(0) |
|
|
+ G1_REG_STARTMB_Y(0);
|
|
+ vdpu_write_relaxed(vpu, reg, G1_SWREG(48));
|
|
+
|
|
+ reg = G1_REG_PRED_BC_TAP_0_0(1) |
|
|
+ G1_REG_PRED_BC_TAP_0_1((u32)-5) |
|
|
+ G1_REG_PRED_BC_TAP_0_2(20);
|
|
+ vdpu_write_relaxed(vpu, reg, G1_SWREG(49));
|
|
+
|
|
+ reg = G1_REG_REFBU_E(0);
|
|
+ vdpu_write_relaxed(vpu, reg, G1_SWREG(51));
|
|
+
|
|
+ reg = G1_REG_APF_THRESHOLD(8);
|
|
+ vdpu_write_relaxed(vpu, reg, G1_SWREG(55));
|
|
|
|
- /* Set up addresses of DPB buffers. */
|
|
- for (i = 0; i < HANTRO_H264_DPB_SIZE; i++) {
|
|
- dma_addr_t dma_addr = hantro_h264_get_ref_buf(ctx, i);
|
|
-
|
|
- vdpu_write_relaxed(vpu, dma_addr, G1_REG_ADDR_REF(i));
|
|
- }
|
|
-}
|
|
-
|
|
-static void set_buffers(struct hantro_ctx *ctx)
|
|
-{
|
|
- const struct hantro_h264_dec_ctrls *ctrls = &ctx->h264_dec.ctrls;
|
|
- struct vb2_v4l2_buffer *src_buf, *dst_buf;
|
|
- struct hantro_dev *vpu = ctx->dev;
|
|
- dma_addr_t src_dma, dst_dma;
|
|
- size_t offset = 0;
|
|
-
|
|
- src_buf = hantro_get_src_buf(ctx);
|
|
- dst_buf = hantro_get_dst_buf(ctx);
|
|
+ /* Auxiliary buffer prepared in hantro_g1_h264_dec_prepare_table(). */
|
|
+ vdpu_write_relaxed(vpu, ctx->h264_dec.priv.dma, G1_REG_QTABLE_BASE);
|
|
|
|
/* Source (stream) buffer. */
|
|
- src_dma = vb2_dma_contig_plane_dma_addr(&src_buf->vb2_buf, 0);
|
|
- vdpu_write_relaxed(vpu, src_dma, G1_REG_ADDR_STR);
|
|
+ addr = vb2_dma_contig_plane_dma_addr(&src_buf->vb2_buf, 0);
|
|
+ vdpu_write_relaxed(vpu, addr, G1_REG_RLC_VLC_BASE);
|
|
|
|
/* Destination (decoded frame) buffer. */
|
|
- dst_dma = hantro_get_dec_buf_addr(ctx, &dst_buf->vb2_buf);
|
|
+ addr = hantro_get_dec_buf_addr(ctx, &dst_buf->vb2_buf);
|
|
/* Adjust dma addr to start at second line for bottom field */
|
|
- if (ctrls->slices[0].flags & V4L2_H264_SLICE_FLAG_BOTTOM_FIELD)
|
|
+ if (slices[0].flags & V4L2_H264_SLICE_FLAG_BOTTOM_FIELD)
|
|
offset = ALIGN(ctx->src_fmt.width, MB_DIM);
|
|
- vdpu_write_relaxed(vpu, dst_dma + offset, G1_REG_ADDR_DST);
|
|
+ vdpu_write_relaxed(vpu, addr + offset, G1_REG_DEC_OUT_BASE);
|
|
|
|
/* Higher profiles require DMV buffer appended to reference frames. */
|
|
- if (ctrls->sps->profile_idc > 66 && ctrls->decode->nal_ref_idc) {
|
|
+ if (sps->profile_idc > 66 && decode->nal_ref_idc) {
|
|
unsigned int bytes_per_mb = 384;
|
|
|
|
/* DMV buffer for monochrome start directly after Y-plane */
|
|
- if (ctrls->sps->profile_idc >= 100 &&
|
|
- ctrls->sps->chroma_format_idc == 0)
|
|
+ if (sps->profile_idc >= 100 && sps->chroma_format_idc == 0)
|
|
bytes_per_mb = 256;
|
|
offset = bytes_per_mb * MB_WIDTH(ctx->src_fmt.width) *
|
|
MB_HEIGHT(ctx->src_fmt.height);
|
|
@@ -252,42 +447,32 @@ static void set_buffers(struct hantro_ctx *ctx)
|
|
* DMV buffer is split in two for field encoded frames,
|
|
* adjust offset for bottom field
|
|
*/
|
|
- if (ctrls->slices[0].flags & V4L2_H264_SLICE_FLAG_BOTTOM_FIELD)
|
|
+ if (slices[0].flags & V4L2_H264_SLICE_FLAG_BOTTOM_FIELD)
|
|
offset += 32 * MB_WIDTH(ctx->src_fmt.width) *
|
|
MB_HEIGHT(ctx->src_fmt.height);
|
|
- vdpu_write_relaxed(vpu, dst_dma + offset, G1_REG_ADDR_DIR_MV);
|
|
+ vdpu_write_relaxed(vpu, addr + offset, G1_REG_DIR_MV_BASE);
|
|
}
|
|
|
|
- /* Auxiliary buffer prepared in hantro_g1_h264_dec_prepare_table(). */
|
|
- vdpu_write_relaxed(vpu, ctx->h264_dec.priv.dma, G1_REG_ADDR_QTABLE);
|
|
-}
|
|
-
|
|
-void hantro_g1_h264_dec_run(struct hantro_ctx *ctx)
|
|
-{
|
|
- struct hantro_dev *vpu = ctx->dev;
|
|
-
|
|
- /* Prepare the H264 decoder context. */
|
|
- if (hantro_h264_dec_prepare_run(ctx))
|
|
- return;
|
|
-
|
|
- /* Configure hardware registers. */
|
|
- set_params(ctx);
|
|
- set_ref(ctx);
|
|
- set_buffers(ctx);
|
|
+ vdpu_write_relaxed(vpu, hantro_h264_get_ref_buf(ctx, 0), G1_REG_REFER0_BASE);
|
|
+ vdpu_write_relaxed(vpu, hantro_h264_get_ref_buf(ctx, 1), G1_REG_REFER1_BASE);
|
|
+ vdpu_write_relaxed(vpu, hantro_h264_get_ref_buf(ctx, 2), G1_REG_REFER2_BASE);
|
|
+ vdpu_write_relaxed(vpu, hantro_h264_get_ref_buf(ctx, 3), G1_REG_REFER3_BASE);
|
|
+ vdpu_write_relaxed(vpu, hantro_h264_get_ref_buf(ctx, 4), G1_REG_REFER4_BASE);
|
|
+ vdpu_write_relaxed(vpu, hantro_h264_get_ref_buf(ctx, 5), G1_REG_REFER5_BASE);
|
|
+ vdpu_write_relaxed(vpu, hantro_h264_get_ref_buf(ctx, 6), G1_REG_REFER6_BASE);
|
|
+ vdpu_write_relaxed(vpu, hantro_h264_get_ref_buf(ctx, 7), G1_REG_REFER7_BASE);
|
|
+ vdpu_write_relaxed(vpu, hantro_h264_get_ref_buf(ctx, 8), G1_REG_REFER8_BASE);
|
|
+ vdpu_write_relaxed(vpu, hantro_h264_get_ref_buf(ctx, 9), G1_REG_REFER9_BASE);
|
|
+ vdpu_write_relaxed(vpu, hantro_h264_get_ref_buf(ctx, 10), G1_REG_REFER10_BASE);
|
|
+ vdpu_write_relaxed(vpu, hantro_h264_get_ref_buf(ctx, 11), G1_REG_REFER11_BASE);
|
|
+ vdpu_write_relaxed(vpu, hantro_h264_get_ref_buf(ctx, 12), G1_REG_REFER12_BASE);
|
|
+ vdpu_write_relaxed(vpu, hantro_h264_get_ref_buf(ctx, 13), G1_REG_REFER13_BASE);
|
|
+ vdpu_write_relaxed(vpu, hantro_h264_get_ref_buf(ctx, 14), G1_REG_REFER14_BASE);
|
|
+ vdpu_write_relaxed(vpu, hantro_h264_get_ref_buf(ctx, 15), G1_REG_REFER15_BASE);
|
|
|
|
hantro_end_prepare_run(ctx);
|
|
|
|
/* Start decoding! */
|
|
- vdpu_write_relaxed(vpu,
|
|
- G1_REG_CONFIG_DEC_AXI_RD_ID(0xffu) |
|
|
- G1_REG_CONFIG_DEC_TIMEOUT_E |
|
|
- G1_REG_CONFIG_DEC_OUT_ENDIAN |
|
|
- G1_REG_CONFIG_DEC_STRENDIAN_E |
|
|
- G1_REG_CONFIG_DEC_MAX_BURST(16) |
|
|
- G1_REG_CONFIG_DEC_OUTSWAP32_E |
|
|
- G1_REG_CONFIG_DEC_INSWAP32_E |
|
|
- G1_REG_CONFIG_DEC_STRSWAP32_E |
|
|
- G1_REG_CONFIG_DEC_CLK_GATE_E,
|
|
- G1_REG_CONFIG);
|
|
- vdpu_write(vpu, G1_REG_INTERRUPT_DEC_E, G1_REG_INTERRUPT);
|
|
+ reg = G1_REG_DEC_E(1);
|
|
+ vdpu_write(vpu, reg, G1_SWREG(1));
|
|
}
|
|
diff --git a/drivers/staging/media/hantro/hantro_h264.c b/drivers/staging/media/hantro/hantro_h264.c
|
|
index 4db779354e89..2edcdda2ad63 100644
|
|
--- a/drivers/staging/media/hantro/hantro_h264.c
|
|
+++ b/drivers/staging/media/hantro/hantro_h264.c
|
|
@@ -596,6 +596,20 @@ dma_addr_t hantro_h264_get_ref_buf(struct hantro_ctx *ctx,
|
|
return dma_addr | flags;
|
|
}
|
|
|
|
+u16 hantro_h264_get_ref_nbr(struct hantro_ctx *ctx,
|
|
+ unsigned int dpb_idx)
|
|
+{
|
|
+ const struct v4l2_h264_dpb_entry *dpb = &ctx->h264_dec.dpb[dpb_idx];
|
|
+
|
|
+ if (!(dpb->flags & V4L2_H264_DPB_ENTRY_FLAG_ACTIVE))
|
|
+ return 0;
|
|
+
|
|
+ if (dpb->flags & V4L2_H264_DPB_ENTRY_FLAG_LONG_TERM)
|
|
+ return dpb->pic_num;
|
|
+
|
|
+ return dpb->frame_num;
|
|
+}
|
|
+
|
|
int hantro_h264_dec_prepare_run(struct hantro_ctx *ctx)
|
|
{
|
|
struct hantro_h264_dec_hw_ctx *h264_ctx = &ctx->h264_dec;
|
|
diff --git a/drivers/staging/media/hantro/hantro_hw.h b/drivers/staging/media/hantro/hantro_hw.h
|
|
index 3dc7b8f27c32..fadd3e1bf0d9 100644
|
|
--- a/drivers/staging/media/hantro/hantro_hw.h
|
|
+++ b/drivers/staging/media/hantro/hantro_hw.h
|
|
@@ -172,6 +172,8 @@ void hantro_jpeg_enc_exit(struct hantro_ctx *ctx);
|
|
|
|
dma_addr_t hantro_h264_get_ref_buf(struct hantro_ctx *ctx,
|
|
unsigned int dpb_idx);
|
|
+u16 hantro_h264_get_ref_nbr(struct hantro_ctx *ctx,
|
|
+ unsigned int dpb_idx);
|
|
int hantro_h264_dec_prepare_run(struct hantro_ctx *ctx);
|
|
void hantro_g1_h264_dec_run(struct hantro_ctx *ctx);
|
|
int hantro_h264_dec_init(struct hantro_ctx *ctx);
|
|
--
|
|
2.17.1
|
|
|
|
|
|
From 93fc47fb35fdbcc94bf1f1008fccffe16d7465c4 Mon Sep 17 00:00:00 2001
|
|
From: Jonas Karlman <jonas@kwiboo.se>
|
|
Date: Sun, 18 Aug 2019 10:40:31 +0000
|
|
Subject: [PATCH] media: hantro: Add support for H264 decoding on RK3399
|
|
|
|
Signed-off-by: Jonas Karlman <jonas@kwiboo.se>
|
|
---
|
|
drivers/staging/media/hantro/Makefile | 1 +
|
|
drivers/staging/media/hantro/hantro_hw.h | 1 +
|
|
.../media/hantro/rk3399_vpu_hw_h264_dec.c | 493 ++++++++++++++++++
|
|
3 files changed, 495 insertions(+)
|
|
create mode 100644 drivers/staging/media/hantro/rk3399_vpu_hw_h264_dec.c
|
|
|
|
diff --git a/drivers/staging/media/hantro/Makefile b/drivers/staging/media/hantro/Makefile
|
|
index 496b30c3c396..9bb8a560cb0a 100644
|
|
--- a/drivers/staging/media/hantro/Makefile
|
|
+++ b/drivers/staging/media/hantro/Makefile
|
|
@@ -9,6 +9,7 @@ hantro-vpu-y += \
|
|
hantro_g1_mpeg2_dec.o \
|
|
hantro_g1_vp8_dec.o \
|
|
rk3399_vpu_hw_jpeg_enc.o \
|
|
+ rk3399_vpu_hw_h264_dec.o \
|
|
rk3399_vpu_hw_mpeg2_dec.o \
|
|
rk3399_vpu_hw_vp8_dec.o \
|
|
hantro_jpeg.o \
|
|
diff --git a/drivers/staging/media/hantro/hantro_hw.h b/drivers/staging/media/hantro/hantro_hw.h
|
|
index fadd3e1bf0d9..4a64873bf332 100644
|
|
--- a/drivers/staging/media/hantro/hantro_hw.h
|
|
+++ b/drivers/staging/media/hantro/hantro_hw.h
|
|
@@ -176,6 +176,7 @@ u16 hantro_h264_get_ref_nbr(struct hantro_ctx *ctx,
|
|
unsigned int dpb_idx);
|
|
int hantro_h264_dec_prepare_run(struct hantro_ctx *ctx);
|
|
void hantro_g1_h264_dec_run(struct hantro_ctx *ctx);
|
|
+void rk3399_vpu_h264_dec_run(struct hantro_ctx *ctx);
|
|
int hantro_h264_dec_init(struct hantro_ctx *ctx);
|
|
void hantro_h264_dec_exit(struct hantro_ctx *ctx);
|
|
|
|
diff --git a/drivers/staging/media/hantro/rk3399_vpu_hw_h264_dec.c b/drivers/staging/media/hantro/rk3399_vpu_hw_h264_dec.c
|
|
new file mode 100644
|
|
index 000000000000..1f9de7d5a923
|
|
--- /dev/null
|
|
+++ b/drivers/staging/media/hantro/rk3399_vpu_hw_h264_dec.c
|
|
@@ -0,0 +1,493 @@
|
|
+// SPDX-License-Identifier: GPL-2.0
|
|
+/*
|
|
+ * Hantro VPU codec driver
|
|
+ *
|
|
+ * Copyright (c) 2014 Rockchip Electronics Co., Ltd.
|
|
+ * Hertz Wong <hertz.wong@rock-chips.com>
|
|
+ * Herman Chen <herman.chen@rock-chips.com>
|
|
+ *
|
|
+ * Copyright (C) 2014 Google, Inc.
|
|
+ * Tomasz Figa <tfiga@chromium.org>
|
|
+ */
|
|
+
|
|
+#include <linux/types.h>
|
|
+#include <linux/sort.h>
|
|
+
|
|
+#include <media/v4l2-mem2mem.h>
|
|
+
|
|
+#include "hantro_hw.h"
|
|
+#include "hantro_v4l2.h"
|
|
+
|
|
+#define VDPU_SWREG(nr) ((nr) * 4)
|
|
+
|
|
+#define VDPU_REG_DEC_OUT_BASE VDPU_SWREG(63)
|
|
+#define VDPU_REG_RLC_VLC_BASE VDPU_SWREG(64)
|
|
+#define VDPU_REG_QTABLE_BASE VDPU_SWREG(61)
|
|
+#define VDPU_REG_DIR_MV_BASE VDPU_SWREG(62)
|
|
+#define VDPU_REG_REFER0_BASE VDPU_SWREG(84)
|
|
+#define VDPU_REG_REFER1_BASE VDPU_SWREG(85)
|
|
+#define VDPU_REG_REFER2_BASE VDPU_SWREG(86)
|
|
+#define VDPU_REG_REFER3_BASE VDPU_SWREG(87)
|
|
+#define VDPU_REG_REFER4_BASE VDPU_SWREG(88)
|
|
+#define VDPU_REG_REFER5_BASE VDPU_SWREG(89)
|
|
+#define VDPU_REG_REFER6_BASE VDPU_SWREG(90)
|
|
+#define VDPU_REG_REFER7_BASE VDPU_SWREG(91)
|
|
+#define VDPU_REG_REFER8_BASE VDPU_SWREG(92)
|
|
+#define VDPU_REG_REFER9_BASE VDPU_SWREG(93)
|
|
+#define VDPU_REG_REFER10_BASE VDPU_SWREG(94)
|
|
+#define VDPU_REG_REFER11_BASE VDPU_SWREG(95)
|
|
+#define VDPU_REG_REFER12_BASE VDPU_SWREG(96)
|
|
+#define VDPU_REG_REFER13_BASE VDPU_SWREG(97)
|
|
+#define VDPU_REG_REFER14_BASE VDPU_SWREG(98)
|
|
+#define VDPU_REG_REFER15_BASE VDPU_SWREG(99)
|
|
+#define VDPU_REG_DEC_E(v) ((v) ? BIT(0) : 0)
|
|
+
|
|
+#define VDPU_REG_DEC_ADV_PRE_DIS(v) ((v) ? BIT(11) : 0)
|
|
+#define VDPU_REG_DEC_SCMD_DIS(v) ((v) ? BIT(10) : 0)
|
|
+#define VDPU_REG_FILTERING_DIS(v) ((v) ? BIT(8) : 0)
|
|
+#define VDPU_REG_PIC_FIXED_QUANT(v) ((v) ? BIT(7) : 0)
|
|
+#define VDPU_REG_DEC_LATENCY(v) (((v) << 1) & GENMASK(6, 1))
|
|
+
|
|
+#define VDPU_REG_INIT_QP(v) (((v) << 25) & GENMASK(30, 25))
|
|
+#define VDPU_REG_STREAM_LEN(v) (((v) << 0) & GENMASK(23, 0))
|
|
+
|
|
+#define VDPU_REG_APF_THRESHOLD(v) (((v) << 17) & GENMASK(30, 17))
|
|
+#define VDPU_REG_STARTMB_X(v) (((v) << 8) & GENMASK(16, 8))
|
|
+#define VDPU_REG_STARTMB_Y(v) (((v) << 0) & GENMASK(7, 0))
|
|
+
|
|
+#define VDPU_REG_DEC_MODE(v) (((v) << 0) & GENMASK(3, 0))
|
|
+
|
|
+#define VDPU_REG_DEC_STRENDIAN_E(v) ((v) ? BIT(5) : 0)
|
|
+#define VDPU_REG_DEC_STRSWAP32_E(v) ((v) ? BIT(4) : 0)
|
|
+#define VDPU_REG_DEC_OUTSWAP32_E(v) ((v) ? BIT(3) : 0)
|
|
+#define VDPU_REG_DEC_INSWAP32_E(v) ((v) ? BIT(2) : 0)
|
|
+#define VDPU_REG_DEC_OUT_ENDIAN(v) ((v) ? BIT(1) : 0)
|
|
+#define VDPU_REG_DEC_IN_ENDIAN(v) ((v) ? BIT(0) : 0)
|
|
+
|
|
+#define VDPU_REG_DEC_DATA_DISC_E(v) ((v) ? BIT(22) : 0)
|
|
+#define VDPU_REG_DEC_MAX_BURST(v) (((v) << 16) & GENMASK(20, 16))
|
|
+#define VDPU_REG_DEC_AXI_WR_ID(v) (((v) << 8) & GENMASK(15, 8))
|
|
+#define VDPU_REG_DEC_AXI_RD_ID(v) (((v) << 0) & GENMASK(7, 0))
|
|
+
|
|
+#define VDPU_REG_START_CODE_E(v) ((v) ? BIT(22) : 0)
|
|
+#define VDPU_REG_CH_8PIX_ILEAV_E(v) ((v) ? BIT(21) : 0)
|
|
+#define VDPU_REG_RLC_MODE_E(v) ((v) ? BIT(20) : 0)
|
|
+#define VDPU_REG_PIC_INTERLACE_E(v) ((v) ? BIT(17) : 0)
|
|
+#define VDPU_REG_PIC_FIELDMODE_E(v) ((v) ? BIT(16) : 0)
|
|
+#define VDPU_REG_PIC_TOPFIELD_E(v) ((v) ? BIT(13) : 0)
|
|
+#define VDPU_REG_WRITE_MVS_E(v) ((v) ? BIT(10) : 0)
|
|
+#define VDPU_REG_SEQ_MBAFF_E(v) ((v) ? BIT(7) : 0)
|
|
+#define VDPU_REG_PICORD_COUNT_E(v) ((v) ? BIT(6) : 0)
|
|
+#define VDPU_REG_DEC_TIMEOUT_E(v) ((v) ? BIT(5) : 0)
|
|
+#define VDPU_REG_DEC_CLK_GATE_E(v) ((v) ? BIT(4) : 0)
|
|
+
|
|
+#define VDPU_REG_PRED_BC_TAP_0_0(v) (((v) << 22) & GENMASK(31, 22))
|
|
+#define VDPU_REG_PRED_BC_TAP_0_1(v) (((v) << 12) & GENMASK(21, 12))
|
|
+#define VDPU_REG_PRED_BC_TAP_0_2(v) (((v) << 2) & GENMASK(11, 2))
|
|
+
|
|
+#define VDPU_REG_REFBU_E(v) ((v) ? BIT(31) : 0)
|
|
+
|
|
+#define VDPU_REG_PINIT_RLIST_F9(v) (((v) << 25) & GENMASK(29, 25))
|
|
+#define VDPU_REG_PINIT_RLIST_F8(v) (((v) << 20) & GENMASK(24, 20))
|
|
+#define VDPU_REG_PINIT_RLIST_F7(v) (((v) << 15) & GENMASK(19, 15))
|
|
+#define VDPU_REG_PINIT_RLIST_F6(v) (((v) << 10) & GENMASK(14, 10))
|
|
+#define VDPU_REG_PINIT_RLIST_F5(v) (((v) << 5) & GENMASK(9, 5))
|
|
+#define VDPU_REG_PINIT_RLIST_F4(v) (((v) << 0) & GENMASK(4, 0))
|
|
+
|
|
+#define VDPU_REG_PINIT_RLIST_F15(v) (((v) << 25) & GENMASK(29, 25))
|
|
+#define VDPU_REG_PINIT_RLIST_F14(v) (((v) << 20) & GENMASK(24, 20))
|
|
+#define VDPU_REG_PINIT_RLIST_F13(v) (((v) << 15) & GENMASK(19, 15))
|
|
+#define VDPU_REG_PINIT_RLIST_F12(v) (((v) << 10) & GENMASK(14, 10))
|
|
+#define VDPU_REG_PINIT_RLIST_F11(v) (((v) << 5) & GENMASK(9, 5))
|
|
+#define VDPU_REG_PINIT_RLIST_F10(v) (((v) << 0) & GENMASK(4, 0))
|
|
+
|
|
+#define VDPU_REG_REFER1_NBR(v) (((v) << 16) & GENMASK(31, 16))
|
|
+#define VDPU_REG_REFER0_NBR(v) (((v) << 0) & GENMASK(15, 0))
|
|
+
|
|
+#define VDPU_REG_REFER3_NBR(v) (((v) << 16) & GENMASK(31, 16))
|
|
+#define VDPU_REG_REFER2_NBR(v) (((v) << 0) & GENMASK(15, 0))
|
|
+
|
|
+#define VDPU_REG_REFER5_NBR(v) (((v) << 16) & GENMASK(31, 16))
|
|
+#define VDPU_REG_REFER4_NBR(v) (((v) << 0) & GENMASK(15, 0))
|
|
+
|
|
+#define VDPU_REG_REFER7_NBR(v) (((v) << 16) & GENMASK(31, 16))
|
|
+#define VDPU_REG_REFER6_NBR(v) (((v) << 0) & GENMASK(15, 0))
|
|
+
|
|
+#define VDPU_REG_REFER9_NBR(v) (((v) << 16) & GENMASK(31, 16))
|
|
+#define VDPU_REG_REFER8_NBR(v) (((v) << 0) & GENMASK(15, 0))
|
|
+
|
|
+#define VDPU_REG_REFER11_NBR(v) (((v) << 16) & GENMASK(31, 16))
|
|
+#define VDPU_REG_REFER10_NBR(v) (((v) << 0) & GENMASK(15, 0))
|
|
+
|
|
+#define VDPU_REG_REFER13_NBR(v) (((v) << 16) & GENMASK(31, 16))
|
|
+#define VDPU_REG_REFER12_NBR(v) (((v) << 0) & GENMASK(15, 0))
|
|
+
|
|
+#define VDPU_REG_REFER15_NBR(v) (((v) << 16) & GENMASK(31, 16))
|
|
+#define VDPU_REG_REFER14_NBR(v) (((v) << 0) & GENMASK(15, 0))
|
|
+
|
|
+#define VDPU_REG_BINIT_RLIST_F5(v) (((v) << 25) & GENMASK(29, 25))
|
|
+#define VDPU_REG_BINIT_RLIST_F4(v) (((v) << 20) & GENMASK(24, 20))
|
|
+#define VDPU_REG_BINIT_RLIST_F3(v) (((v) << 15) & GENMASK(19, 15))
|
|
+#define VDPU_REG_BINIT_RLIST_F2(v) (((v) << 10) & GENMASK(14, 10))
|
|
+#define VDPU_REG_BINIT_RLIST_F1(v) (((v) << 5) & GENMASK(9, 5))
|
|
+#define VDPU_REG_BINIT_RLIST_F0(v) (((v) << 0) & GENMASK(4, 0))
|
|
+
|
|
+#define VDPU_REG_BINIT_RLIST_F11(v) (((v) << 25) & GENMASK(29, 25))
|
|
+#define VDPU_REG_BINIT_RLIST_F10(v) (((v) << 20) & GENMASK(24, 20))
|
|
+#define VDPU_REG_BINIT_RLIST_F9(v) (((v) << 15) & GENMASK(19, 15))
|
|
+#define VDPU_REG_BINIT_RLIST_F8(v) (((v) << 10) & GENMASK(14, 10))
|
|
+#define VDPU_REG_BINIT_RLIST_F7(v) (((v) << 5) & GENMASK(9, 5))
|
|
+#define VDPU_REG_BINIT_RLIST_F6(v) (((v) << 0) & GENMASK(4, 0))
|
|
+
|
|
+#define VDPU_REG_BINIT_RLIST_F15(v) (((v) << 15) & GENMASK(19, 15))
|
|
+#define VDPU_REG_BINIT_RLIST_F14(v) (((v) << 10) & GENMASK(14, 10))
|
|
+#define VDPU_REG_BINIT_RLIST_F13(v) (((v) << 5) & GENMASK(9, 5))
|
|
+#define VDPU_REG_BINIT_RLIST_F12(v) (((v) << 0) & GENMASK(4, 0))
|
|
+
|
|
+#define VDPU_REG_BINIT_RLIST_B5(v) (((v) << 25) & GENMASK(29, 25))
|
|
+#define VDPU_REG_BINIT_RLIST_B4(v) (((v) << 20) & GENMASK(24, 20))
|
|
+#define VDPU_REG_BINIT_RLIST_B3(v) (((v) << 15) & GENMASK(19, 15))
|
|
+#define VDPU_REG_BINIT_RLIST_B2(v) (((v) << 10) & GENMASK(14, 10))
|
|
+#define VDPU_REG_BINIT_RLIST_B1(v) (((v) << 5) & GENMASK(9, 5))
|
|
+#define VDPU_REG_BINIT_RLIST_B0(v) (((v) << 0) & GENMASK(4, 0))
|
|
+
|
|
+#define VDPU_REG_BINIT_RLIST_B11(v) (((v) << 25) & GENMASK(29, 25))
|
|
+#define VDPU_REG_BINIT_RLIST_B10(v) (((v) << 20) & GENMASK(24, 20))
|
|
+#define VDPU_REG_BINIT_RLIST_B9(v) (((v) << 15) & GENMASK(19, 15))
|
|
+#define VDPU_REG_BINIT_RLIST_B8(v) (((v) << 10) & GENMASK(14, 10))
|
|
+#define VDPU_REG_BINIT_RLIST_B7(v) (((v) << 5) & GENMASK(9, 5))
|
|
+#define VDPU_REG_BINIT_RLIST_B6(v) (((v) << 0) & GENMASK(4, 0))
|
|
+
|
|
+#define VDPU_REG_BINIT_RLIST_B15(v) (((v) << 15) & GENMASK(19, 15))
|
|
+#define VDPU_REG_BINIT_RLIST_B14(v) (((v) << 10) & GENMASK(14, 10))
|
|
+#define VDPU_REG_BINIT_RLIST_B13(v) (((v) << 5) & GENMASK(9, 5))
|
|
+#define VDPU_REG_BINIT_RLIST_B12(v) (((v) << 0) & GENMASK(4, 0))
|
|
+
|
|
+#define VDPU_REG_PINIT_RLIST_F3(v) (((v) << 15) & GENMASK(19, 15))
|
|
+#define VDPU_REG_PINIT_RLIST_F2(v) (((v) << 10) & GENMASK(14, 10))
|
|
+#define VDPU_REG_PINIT_RLIST_F1(v) (((v) << 5) & GENMASK(9, 5))
|
|
+#define VDPU_REG_PINIT_RLIST_F0(v) (((v) << 0) & GENMASK(4, 0))
|
|
+
|
|
+#define VDPU_REG_REFER_LTERM_E(v) (((v) << 0) & GENMASK(31, 0))
|
|
+
|
|
+#define VDPU_REG_REFER_VALID_E(v) (((v) << 0) & GENMASK(31, 0))
|
|
+
|
|
+#define VDPU_REG_STRM_START_BIT(v) (((v) << 0) & GENMASK(5, 0))
|
|
+
|
|
+#define VDPU_REG_CH_QP_OFFSET2(v) (((v) << 22) & GENMASK(26, 22))
|
|
+#define VDPU_REG_CH_QP_OFFSET(v) (((v) << 17) & GENMASK(21, 17))
|
|
+#define VDPU_REG_PIC_MB_HEIGHT_P(v) (((v) << 9) & GENMASK(16, 9))
|
|
+#define VDPU_REG_PIC_MB_WIDTH(v) (((v) << 0) & GENMASK(8, 0))
|
|
+
|
|
+#define VDPU_REG_WEIGHT_BIPR_IDC(v) (((v) << 16) & GENMASK(17, 16))
|
|
+#define VDPU_REG_REF_FRAMES(v) (((v) << 0) & GENMASK(4, 0))
|
|
+
|
|
+#define VDPU_REG_FILT_CTRL_PRES(v) ((v) ? BIT(31) : 0)
|
|
+#define VDPU_REG_RDPIC_CNT_PRES(v) ((v) ? BIT(30) : 0)
|
|
+#define VDPU_REG_FRAMENUM_LEN(v) (((v) << 16) & GENMASK(20, 16))
|
|
+#define VDPU_REG_FRAMENUM(v) (((v) << 0) & GENMASK(15, 0))
|
|
+
|
|
+#define VDPU_REG_REFPIC_MK_LEN(v) (((v) << 16) & GENMASK(26, 16))
|
|
+#define VDPU_REG_IDR_PIC_ID(v) (((v) << 0) & GENMASK(15, 0))
|
|
+
|
|
+#define VDPU_REG_PPS_ID(v) (((v) << 24) & GENMASK(31, 24))
|
|
+#define VDPU_REG_REFIDX1_ACTIVE(v) (((v) << 19) & GENMASK(23, 19))
|
|
+#define VDPU_REG_REFIDX0_ACTIVE(v) (((v) << 14) & GENMASK(18, 14))
|
|
+#define VDPU_REG_POC_LENGTH(v) (((v) << 0) & GENMASK(7, 0))
|
|
+
|
|
+#define VDPU_REG_IDR_PIC_E(v) ((v) ? BIT(8) : 0)
|
|
+#define VDPU_REG_DIR_8X8_INFER_E(v) ((v) ? BIT(7) : 0)
|
|
+#define VDPU_REG_BLACKWHITE_E(v) ((v) ? BIT(6) : 0)
|
|
+#define VDPU_REG_CABAC_E(v) ((v) ? BIT(5) : 0)
|
|
+#define VDPU_REG_WEIGHT_PRED_E(v) ((v) ? BIT(4) : 0)
|
|
+#define VDPU_REG_CONST_INTRA_E(v) ((v) ? BIT(3) : 0)
|
|
+#define VDPU_REG_8X8TRANS_FLAG_E(v) ((v) ? BIT(2) : 0)
|
|
+#define VDPU_REG_TYPE1_QUANT_E(v) ((v) ? BIT(1) : 0)
|
|
+#define VDPU_REG_FIELDPIC_FLAG_E(v) ((v) ? BIT(0) : 0)
|
|
+
|
|
+void rk3399_vpu_h264_dec_run(struct hantro_ctx *ctx)
|
|
+{
|
|
+ struct hantro_dev *vpu = ctx->dev;
|
|
+ struct vb2_v4l2_buffer *src_buf, *dst_buf;
|
|
+ const struct hantro_h264_dec_ctrls *ctrls;
|
|
+ const struct v4l2_ctrl_h264_decode_params *decode;
|
|
+ const struct v4l2_ctrl_h264_slice_params *slices;
|
|
+ const struct v4l2_ctrl_h264_sps *sps;
|
|
+ const struct v4l2_ctrl_h264_pps *pps;
|
|
+ const u8 *b0_reflist, *b1_reflist, *p_reflist;
|
|
+ dma_addr_t addr;
|
|
+ size_t offset = 0;
|
|
+ u32 reg;
|
|
+
|
|
+ /* Prepare the H264 decoder context. */
|
|
+ if (hantro_h264_dec_prepare_run(ctx))
|
|
+ return;
|
|
+
|
|
+ src_buf = hantro_get_src_buf(ctx);
|
|
+ dst_buf = hantro_get_dst_buf(ctx);
|
|
+
|
|
+ ctrls = &ctx->h264_dec.ctrls;
|
|
+ decode = ctrls->decode;
|
|
+ slices = ctrls->slices;
|
|
+ sps = ctrls->sps;
|
|
+ pps = ctrls->pps;
|
|
+
|
|
+ b0_reflist = ctx->h264_dec.reflists.b0;
|
|
+ b1_reflist = ctx->h264_dec.reflists.b1;
|
|
+ p_reflist = ctx->h264_dec.reflists.p;
|
|
+
|
|
+ reg = VDPU_REG_DEC_ADV_PRE_DIS(0) |
|
|
+ VDPU_REG_DEC_SCMD_DIS(0) |
|
|
+ VDPU_REG_FILTERING_DIS(0) |
|
|
+ VDPU_REG_PIC_FIXED_QUANT(0) |
|
|
+ VDPU_REG_DEC_LATENCY(0);
|
|
+ vdpu_write_relaxed(vpu, reg, VDPU_SWREG(50));
|
|
+
|
|
+ reg = VDPU_REG_INIT_QP(pps->pic_init_qp_minus26 + 26) |
|
|
+ VDPU_REG_STREAM_LEN(vb2_get_plane_payload(&src_buf->vb2_buf, 0));
|
|
+ vdpu_write_relaxed(vpu, reg, VDPU_SWREG(51));
|
|
+
|
|
+ reg = VDPU_REG_APF_THRESHOLD(8) |
|
|
+ VDPU_REG_STARTMB_X(0) |
|
|
+ VDPU_REG_STARTMB_Y(0);
|
|
+ vdpu_write_relaxed(vpu, reg, VDPU_SWREG(52));
|
|
+
|
|
+ reg = VDPU_REG_DEC_MODE(0);
|
|
+ vdpu_write_relaxed(vpu, reg, VDPU_SWREG(53));
|
|
+
|
|
+ reg = VDPU_REG_DEC_STRENDIAN_E(1) |
|
|
+ VDPU_REG_DEC_STRSWAP32_E(1) |
|
|
+ VDPU_REG_DEC_OUTSWAP32_E(1) |
|
|
+ VDPU_REG_DEC_INSWAP32_E(1) |
|
|
+ VDPU_REG_DEC_OUT_ENDIAN(1) |
|
|
+ VDPU_REG_DEC_IN_ENDIAN(0);
|
|
+ vdpu_write_relaxed(vpu, reg, VDPU_SWREG(54));
|
|
+
|
|
+ reg = VDPU_REG_DEC_DATA_DISC_E(0) |
|
|
+ VDPU_REG_DEC_MAX_BURST(16) |
|
|
+ VDPU_REG_DEC_AXI_WR_ID(0) |
|
|
+ VDPU_REG_DEC_AXI_RD_ID(0xff);
|
|
+ vdpu_write_relaxed(vpu, reg, VDPU_SWREG(56));
|
|
+
|
|
+ reg = VDPU_REG_START_CODE_E(1) |
|
|
+ VDPU_REG_CH_8PIX_ILEAV_E(0) |
|
|
+ VDPU_REG_RLC_MODE_E(0) |
|
|
+ VDPU_REG_PIC_INTERLACE_E(!(sps->flags & V4L2_H264_SPS_FLAG_FRAME_MBS_ONLY) && (sps->flags & V4L2_H264_SPS_FLAG_MB_ADAPTIVE_FRAME_FIELD || slices[0].flags & V4L2_H264_SLICE_FLAG_FIELD_PIC)) |
|
|
+ VDPU_REG_PIC_FIELDMODE_E(slices[0].flags & V4L2_H264_SLICE_FLAG_FIELD_PIC) |
|
|
+ VDPU_REG_PIC_TOPFIELD_E(!(slices[0].flags & V4L2_H264_SLICE_FLAG_BOTTOM_FIELD)) |
|
|
+ VDPU_REG_WRITE_MVS_E(sps->profile_idc > 66 && decode->nal_ref_idc) |
|
|
+ VDPU_REG_SEQ_MBAFF_E(sps->flags & V4L2_H264_SPS_FLAG_MB_ADAPTIVE_FRAME_FIELD) |
|
|
+ VDPU_REG_PICORD_COUNT_E(sps->profile_idc > 66) |
|
|
+ VDPU_REG_DEC_TIMEOUT_E(1) |
|
|
+ VDPU_REG_DEC_CLK_GATE_E(1);
|
|
+ vdpu_write_relaxed(vpu, reg, VDPU_SWREG(57));
|
|
+
|
|
+ reg = VDPU_REG_PRED_BC_TAP_0_0(1) |
|
|
+ VDPU_REG_PRED_BC_TAP_0_1((u32)-5) |
|
|
+ VDPU_REG_PRED_BC_TAP_0_2(20);
|
|
+ vdpu_write_relaxed(vpu, reg, VDPU_SWREG(59));
|
|
+
|
|
+ reg = VDPU_REG_REFBU_E(0);
|
|
+ vdpu_write_relaxed(vpu, reg, VDPU_SWREG(65));
|
|
+
|
|
+ reg = VDPU_REG_PINIT_RLIST_F9(p_reflist[9]) |
|
|
+ VDPU_REG_PINIT_RLIST_F8(p_reflist[8]) |
|
|
+ VDPU_REG_PINIT_RLIST_F7(p_reflist[7]) |
|
|
+ VDPU_REG_PINIT_RLIST_F6(p_reflist[6]) |
|
|
+ VDPU_REG_PINIT_RLIST_F5(p_reflist[5]) |
|
|
+ VDPU_REG_PINIT_RLIST_F4(p_reflist[4]);
|
|
+ vdpu_write_relaxed(vpu, reg, VDPU_SWREG(74));
|
|
+
|
|
+ reg = VDPU_REG_PINIT_RLIST_F15(p_reflist[15]) |
|
|
+ VDPU_REG_PINIT_RLIST_F14(p_reflist[14]) |
|
|
+ VDPU_REG_PINIT_RLIST_F13(p_reflist[13]) |
|
|
+ VDPU_REG_PINIT_RLIST_F12(p_reflist[12]) |
|
|
+ VDPU_REG_PINIT_RLIST_F11(p_reflist[11]) |
|
|
+ VDPU_REG_PINIT_RLIST_F10(p_reflist[10]);
|
|
+ vdpu_write_relaxed(vpu, reg, VDPU_SWREG(75));
|
|
+
|
|
+ reg = VDPU_REG_REFER1_NBR(hantro_h264_get_ref_nbr(ctx, 1)) |
|
|
+ VDPU_REG_REFER0_NBR(hantro_h264_get_ref_nbr(ctx, 0));
|
|
+ vdpu_write_relaxed(vpu, reg, VDPU_SWREG(76));
|
|
+
|
|
+ reg = VDPU_REG_REFER3_NBR(hantro_h264_get_ref_nbr(ctx, 3)) |
|
|
+ VDPU_REG_REFER2_NBR(hantro_h264_get_ref_nbr(ctx, 2));
|
|
+ vdpu_write_relaxed(vpu, reg, VDPU_SWREG(77));
|
|
+
|
|
+ reg = VDPU_REG_REFER5_NBR(hantro_h264_get_ref_nbr(ctx, 5)) |
|
|
+ VDPU_REG_REFER4_NBR(hantro_h264_get_ref_nbr(ctx, 4));
|
|
+ vdpu_write_relaxed(vpu, reg, VDPU_SWREG(78));
|
|
+
|
|
+ reg = VDPU_REG_REFER7_NBR(hantro_h264_get_ref_nbr(ctx, 7)) |
|
|
+ VDPU_REG_REFER6_NBR(hantro_h264_get_ref_nbr(ctx, 6));
|
|
+ vdpu_write_relaxed(vpu, reg, VDPU_SWREG(79));
|
|
+
|
|
+ reg = VDPU_REG_REFER9_NBR(hantro_h264_get_ref_nbr(ctx, 9)) |
|
|
+ VDPU_REG_REFER8_NBR(hantro_h264_get_ref_nbr(ctx, 8));
|
|
+ vdpu_write_relaxed(vpu, reg, VDPU_SWREG(80));
|
|
+
|
|
+ reg = VDPU_REG_REFER11_NBR(hantro_h264_get_ref_nbr(ctx, 11)) |
|
|
+ VDPU_REG_REFER10_NBR(hantro_h264_get_ref_nbr(ctx, 10));
|
|
+ vdpu_write_relaxed(vpu, reg, VDPU_SWREG(81));
|
|
+
|
|
+ reg = VDPU_REG_REFER13_NBR(hantro_h264_get_ref_nbr(ctx, 13)) |
|
|
+ VDPU_REG_REFER12_NBR(hantro_h264_get_ref_nbr(ctx, 12));
|
|
+ vdpu_write_relaxed(vpu, reg, VDPU_SWREG(82));
|
|
+
|
|
+ reg = VDPU_REG_REFER15_NBR(hantro_h264_get_ref_nbr(ctx, 15)) |
|
|
+ VDPU_REG_REFER14_NBR(hantro_h264_get_ref_nbr(ctx, 14));
|
|
+ vdpu_write_relaxed(vpu, reg, VDPU_SWREG(83));
|
|
+
|
|
+ reg = VDPU_REG_BINIT_RLIST_F5(b0_reflist[5]) |
|
|
+ VDPU_REG_BINIT_RLIST_F4(b0_reflist[4]) |
|
|
+ VDPU_REG_BINIT_RLIST_F3(b0_reflist[3]) |
|
|
+ VDPU_REG_BINIT_RLIST_F2(b0_reflist[2]) |
|
|
+ VDPU_REG_BINIT_RLIST_F1(b0_reflist[1]) |
|
|
+ VDPU_REG_BINIT_RLIST_F0(b0_reflist[0]);
|
|
+ vdpu_write_relaxed(vpu, reg, VDPU_SWREG(100));
|
|
+
|
|
+ reg = VDPU_REG_BINIT_RLIST_F11(b0_reflist[11]) |
|
|
+ VDPU_REG_BINIT_RLIST_F10(b0_reflist[10]) |
|
|
+ VDPU_REG_BINIT_RLIST_F9(b0_reflist[9]) |
|
|
+ VDPU_REG_BINIT_RLIST_F8(b0_reflist[8]) |
|
|
+ VDPU_REG_BINIT_RLIST_F7(b0_reflist[7]) |
|
|
+ VDPU_REG_BINIT_RLIST_F6(b0_reflist[6]);
|
|
+ vdpu_write_relaxed(vpu, reg, VDPU_SWREG(101));
|
|
+
|
|
+ reg = VDPU_REG_BINIT_RLIST_F15(b0_reflist[15]) |
|
|
+ VDPU_REG_BINIT_RLIST_F14(b0_reflist[14]) |
|
|
+ VDPU_REG_BINIT_RLIST_F13(b0_reflist[13]) |
|
|
+ VDPU_REG_BINIT_RLIST_F12(b0_reflist[12]);
|
|
+ vdpu_write_relaxed(vpu, reg, VDPU_SWREG(102));
|
|
+
|
|
+ reg = VDPU_REG_BINIT_RLIST_B5(b1_reflist[5]) |
|
|
+ VDPU_REG_BINIT_RLIST_B4(b1_reflist[4]) |
|
|
+ VDPU_REG_BINIT_RLIST_B3(b1_reflist[3]) |
|
|
+ VDPU_REG_BINIT_RLIST_B2(b1_reflist[2]) |
|
|
+ VDPU_REG_BINIT_RLIST_B1(b1_reflist[1]) |
|
|
+ VDPU_REG_BINIT_RLIST_B0(b1_reflist[0]);
|
|
+ vdpu_write_relaxed(vpu, reg, VDPU_SWREG(103));
|
|
+
|
|
+ reg = VDPU_REG_BINIT_RLIST_B11(b1_reflist[11]) |
|
|
+ VDPU_REG_BINIT_RLIST_B10(b1_reflist[10]) |
|
|
+ VDPU_REG_BINIT_RLIST_B9(b1_reflist[9]) |
|
|
+ VDPU_REG_BINIT_RLIST_B8(b1_reflist[8]) |
|
|
+ VDPU_REG_BINIT_RLIST_B7(b1_reflist[7]) |
|
|
+ VDPU_REG_BINIT_RLIST_B6(b1_reflist[6]);
|
|
+ vdpu_write_relaxed(vpu, reg, VDPU_SWREG(104));
|
|
+
|
|
+ reg = VDPU_REG_BINIT_RLIST_B15(b1_reflist[15]) |
|
|
+ VDPU_REG_BINIT_RLIST_B14(b1_reflist[14]) |
|
|
+ VDPU_REG_BINIT_RLIST_B13(b1_reflist[13]) |
|
|
+ VDPU_REG_BINIT_RLIST_B12(b1_reflist[12]);
|
|
+ vdpu_write_relaxed(vpu, reg, VDPU_SWREG(105));
|
|
+
|
|
+ reg = VDPU_REG_PINIT_RLIST_F3(p_reflist[3]) |
|
|
+ VDPU_REG_PINIT_RLIST_F2(p_reflist[2]) |
|
|
+ VDPU_REG_PINIT_RLIST_F1(p_reflist[1]) |
|
|
+ VDPU_REG_PINIT_RLIST_F0(p_reflist[0]);
|
|
+ vdpu_write_relaxed(vpu, reg, VDPU_SWREG(106));
|
|
+
|
|
+ reg = VDPU_REG_REFER_LTERM_E(ctx->h264_dec.dpb_longterm);
|
|
+ vdpu_write_relaxed(vpu, reg, VDPU_SWREG(107));
|
|
+
|
|
+ reg = VDPU_REG_REFER_VALID_E(ctx->h264_dec.dpb_valid);
|
|
+ vdpu_write_relaxed(vpu, reg, VDPU_SWREG(108));
|
|
+
|
|
+ reg = VDPU_REG_STRM_START_BIT(0);
|
|
+ vdpu_write_relaxed(vpu, reg, VDPU_SWREG(109));
|
|
+
|
|
+ reg = VDPU_REG_CH_QP_OFFSET2(pps->second_chroma_qp_index_offset) |
|
|
+ VDPU_REG_CH_QP_OFFSET(pps->chroma_qp_index_offset) |
|
|
+ VDPU_REG_PIC_MB_HEIGHT_P(MB_HEIGHT(ctx->src_fmt.height)) |
|
|
+ VDPU_REG_PIC_MB_WIDTH(MB_WIDTH(ctx->src_fmt.width));
|
|
+ vdpu_write_relaxed(vpu, reg, VDPU_SWREG(110));
|
|
+
|
|
+ reg = VDPU_REG_WEIGHT_BIPR_IDC(pps->weighted_bipred_idc) |
|
|
+ VDPU_REG_REF_FRAMES(sps->max_num_ref_frames);
|
|
+ vdpu_write_relaxed(vpu, reg, VDPU_SWREG(111));
|
|
+
|
|
+ reg = VDPU_REG_FILT_CTRL_PRES(pps->flags & V4L2_H264_PPS_FLAG_DEBLOCKING_FILTER_CONTROL_PRESENT) |
|
|
+ VDPU_REG_RDPIC_CNT_PRES(pps->flags & V4L2_H264_PPS_FLAG_REDUNDANT_PIC_CNT_PRESENT) |
|
|
+ VDPU_REG_FRAMENUM_LEN(sps->log2_max_frame_num_minus4 + 4) |
|
|
+ VDPU_REG_FRAMENUM(slices[0].frame_num);
|
|
+ vdpu_write_relaxed(vpu, reg, VDPU_SWREG(112));
|
|
+
|
|
+ reg = VDPU_REG_REFPIC_MK_LEN(slices[0].dec_ref_pic_marking_bit_size) |
|
|
+ VDPU_REG_IDR_PIC_ID(slices[0].idr_pic_id);
|
|
+ vdpu_write_relaxed(vpu, reg, VDPU_SWREG(113));
|
|
+
|
|
+ reg = VDPU_REG_PPS_ID(slices[0].pic_parameter_set_id) |
|
|
+ VDPU_REG_REFIDX1_ACTIVE(pps->num_ref_idx_l1_default_active_minus1 + 1) |
|
|
+ VDPU_REG_REFIDX0_ACTIVE(pps->num_ref_idx_l0_default_active_minus1 + 1) |
|
|
+ VDPU_REG_POC_LENGTH(slices[0].pic_order_cnt_bit_size);
|
|
+ vdpu_write_relaxed(vpu, reg, VDPU_SWREG(114));
|
|
+
|
|
+ reg = VDPU_REG_IDR_PIC_E(decode->flags & V4L2_H264_DECODE_PARAM_FLAG_IDR_PIC) |
|
|
+ VDPU_REG_DIR_8X8_INFER_E(sps->flags & V4L2_H264_SPS_FLAG_DIRECT_8X8_INFERENCE) |
|
|
+ VDPU_REG_BLACKWHITE_E(sps->profile_idc >= 100 && sps->chroma_format_idc == 0) |
|
|
+ VDPU_REG_CABAC_E(pps->flags & V4L2_H264_PPS_FLAG_ENTROPY_CODING_MODE) |
|
|
+ VDPU_REG_WEIGHT_PRED_E(pps->flags & V4L2_H264_PPS_FLAG_WEIGHTED_PRED) |
|
|
+ VDPU_REG_CONST_INTRA_E(pps->flags & V4L2_H264_PPS_FLAG_CONSTRAINED_INTRA_PRED) |
|
|
+ VDPU_REG_8X8TRANS_FLAG_E(pps->flags & V4L2_H264_PPS_FLAG_TRANSFORM_8X8_MODE) |
|
|
+ VDPU_REG_TYPE1_QUANT_E(1) |
|
|
+ VDPU_REG_FIELDPIC_FLAG_E(!(sps->flags & V4L2_H264_SPS_FLAG_FRAME_MBS_ONLY));
|
|
+ vdpu_write_relaxed(vpu, reg, VDPU_SWREG(115));
|
|
+
|
|
+ /* Auxiliary buffer prepared in hantro_g1_h264_dec_prepare_table(). */
|
|
+ vdpu_write_relaxed(vpu, ctx->h264_dec.priv.dma, VDPU_REG_QTABLE_BASE);
|
|
+
|
|
+ /* Source (stream) buffer. */
|
|
+ addr = vb2_dma_contig_plane_dma_addr(&src_buf->vb2_buf, 0);
|
|
+ vdpu_write_relaxed(vpu, addr, VDPU_REG_RLC_VLC_BASE);
|
|
+
|
|
+ /* Destination (decoded frame) buffer. */
|
|
+ addr = hantro_get_dec_buf_addr(ctx, &dst_buf->vb2_buf);
|
|
+ /* Adjust dma addr to start at second line for bottom field */
|
|
+ if (slices[0].flags & V4L2_H264_SLICE_FLAG_BOTTOM_FIELD)
|
|
+ offset = ALIGN(ctx->src_fmt.width, MB_DIM);
|
|
+ vdpu_write_relaxed(vpu, addr + offset, VDPU_REG_DEC_OUT_BASE);
|
|
+
|
|
+ /* Higher profiles require DMV buffer appended to reference frames. */
|
|
+ if (sps->profile_idc > 66 && decode->nal_ref_idc) {
|
|
+ unsigned int bytes_per_mb = 384;
|
|
+
|
|
+ /* DMV buffer for monochrome start directly after Y-plane */
|
|
+ if (sps->profile_idc >= 100 && sps->chroma_format_idc == 0)
|
|
+ bytes_per_mb = 256;
|
|
+ offset = bytes_per_mb * MB_WIDTH(ctx->src_fmt.width) *
|
|
+ MB_HEIGHT(ctx->src_fmt.height);
|
|
+
|
|
+ /*
|
|
+ * DMV buffer is split in two for field encoded frames,
|
|
+ * adjust offset for bottom field
|
|
+ */
|
|
+ if (slices[0].flags & V4L2_H264_SLICE_FLAG_BOTTOM_FIELD)
|
|
+ offset += 32 * MB_WIDTH(ctx->src_fmt.width) *
|
|
+ MB_HEIGHT(ctx->src_fmt.height);
|
|
+ vdpu_write_relaxed(vpu, addr + offset, VDPU_REG_DIR_MV_BASE);
|
|
+ }
|
|
+
|
|
+ vdpu_write_relaxed(vpu, hantro_h264_get_ref_buf(ctx, 0), VDPU_REG_REFER0_BASE);
|
|
+ vdpu_write_relaxed(vpu, hantro_h264_get_ref_buf(ctx, 1), VDPU_REG_REFER1_BASE);
|
|
+ vdpu_write_relaxed(vpu, hantro_h264_get_ref_buf(ctx, 2), VDPU_REG_REFER2_BASE);
|
|
+ vdpu_write_relaxed(vpu, hantro_h264_get_ref_buf(ctx, 3), VDPU_REG_REFER3_BASE);
|
|
+ vdpu_write_relaxed(vpu, hantro_h264_get_ref_buf(ctx, 4), VDPU_REG_REFER4_BASE);
|
|
+ vdpu_write_relaxed(vpu, hantro_h264_get_ref_buf(ctx, 5), VDPU_REG_REFER5_BASE);
|
|
+ vdpu_write_relaxed(vpu, hantro_h264_get_ref_buf(ctx, 6), VDPU_REG_REFER6_BASE);
|
|
+ vdpu_write_relaxed(vpu, hantro_h264_get_ref_buf(ctx, 7), VDPU_REG_REFER7_BASE);
|
|
+ vdpu_write_relaxed(vpu, hantro_h264_get_ref_buf(ctx, 8), VDPU_REG_REFER8_BASE);
|
|
+ vdpu_write_relaxed(vpu, hantro_h264_get_ref_buf(ctx, 9), VDPU_REG_REFER9_BASE);
|
|
+ vdpu_write_relaxed(vpu, hantro_h264_get_ref_buf(ctx, 10), VDPU_REG_REFER10_BASE);
|
|
+ vdpu_write_relaxed(vpu, hantro_h264_get_ref_buf(ctx, 11), VDPU_REG_REFER11_BASE);
|
|
+ vdpu_write_relaxed(vpu, hantro_h264_get_ref_buf(ctx, 12), VDPU_REG_REFER12_BASE);
|
|
+ vdpu_write_relaxed(vpu, hantro_h264_get_ref_buf(ctx, 13), VDPU_REG_REFER13_BASE);
|
|
+ vdpu_write_relaxed(vpu, hantro_h264_get_ref_buf(ctx, 14), VDPU_REG_REFER14_BASE);
|
|
+ vdpu_write_relaxed(vpu, hantro_h264_get_ref_buf(ctx, 15), VDPU_REG_REFER15_BASE);
|
|
+
|
|
+ hantro_end_prepare_run(ctx);
|
|
+
|
|
+ /* Start decoding! */
|
|
+ reg = vdpu_read(vpu, VDPU_SWREG(57)) | VDPU_REG_DEC_E(1);
|
|
+ vdpu_write(vpu, reg, VDPU_SWREG(57));
|
|
+}
|
|
--
|
|
2.17.1
|
|
|
|
|
|
From c6ad44bc8c4de5b6e468ee4449bfa181ff564f5a Mon Sep 17 00:00:00 2001
|
|
From: Jonas Karlman <jonas@kwiboo.se>
|
|
Date: Sun, 18 Aug 2019 10:40:31 +0000
|
|
Subject: [PATCH] media: hantro: Enable H264 decoding on RK3399
|
|
|
|
Signed-off-by: Jonas Karlman <jonas@kwiboo.se>
|
|
---
|
|
drivers/staging/media/hantro/rk3399_vpu_hw.c | 21 +++++++++++++++++++-
|
|
1 file changed, 20 insertions(+), 1 deletion(-)
|
|
|
|
diff --git a/drivers/staging/media/hantro/rk3399_vpu_hw.c b/drivers/staging/media/hantro/rk3399_vpu_hw.c
|
|
index 9ac1f2cb6a16..3e05cd2c870e 100644
|
|
--- a/drivers/staging/media/hantro/rk3399_vpu_hw.c
|
|
+++ b/drivers/staging/media/hantro/rk3399_vpu_hw.c
|
|
@@ -60,6 +60,19 @@ static const struct hantro_fmt rk3399_vpu_dec_fmts[] = {
|
|
.fourcc = V4L2_PIX_FMT_NV12,
|
|
.codec_mode = HANTRO_MODE_NONE,
|
|
},
|
|
+ {
|
|
+ .fourcc = V4L2_PIX_FMT_H264_SLICE,
|
|
+ .codec_mode = HANTRO_MODE_H264_DEC,
|
|
+ .max_depth = 2,
|
|
+ .frmsize = {
|
|
+ .min_width = 48,
|
|
+ .max_width = 1920,
|
|
+ .step_width = MB_DIM,
|
|
+ .min_height = 48,
|
|
+ .max_height = 1088,
|
|
+ .step_height = MB_DIM,
|
|
+ },
|
|
+ },
|
|
{
|
|
.fourcc = V4L2_PIX_FMT_MPEG2_SLICE,
|
|
.codec_mode = HANTRO_MODE_MPEG2_DEC,
|
|
@@ -161,6 +174,12 @@ static const struct hantro_codec_ops rk3399_vpu_codec_ops[] = {
|
|
.init = hantro_jpeg_enc_init,
|
|
.exit = hantro_jpeg_enc_exit,
|
|
},
|
|
+ [HANTRO_MODE_H264_DEC] = {
|
|
+ .run = rk3399_vpu_h264_dec_run,
|
|
+ .reset = rk3399_vpu_dec_reset,
|
|
+ .init = hantro_h264_dec_init,
|
|
+ .exit = hantro_h264_dec_exit,
|
|
+ },
|
|
[HANTRO_MODE_MPEG2_DEC] = {
|
|
.run = rk3399_vpu_mpeg2_dec_run,
|
|
.reset = rk3399_vpu_dec_reset,
|
|
@@ -196,7 +215,7 @@ const struct hantro_variant rk3399_vpu_variant = {
|
|
.dec_fmts = rk3399_vpu_dec_fmts,
|
|
.num_dec_fmts = ARRAY_SIZE(rk3399_vpu_dec_fmts),
|
|
.codec = HANTRO_JPEG_ENCODER | HANTRO_MPEG2_DECODER |
|
|
- HANTRO_VP8_DECODER,
|
|
+ HANTRO_VP8_DECODER | HANTRO_H264_DECODER,
|
|
.codec_ops = rk3399_vpu_codec_ops,
|
|
.irqs = rk3399_irqs,
|
|
.num_irqs = ARRAY_SIZE(rk3399_irqs),
|
|
--
|
|
2.17.1
|
|
|
|
|
|
From 51ec7c26733bd0c96fc9ec7d80b18ee8110d0a7d Mon Sep 17 00:00:00 2001
|
|
From: Jonas Karlman <jonas@kwiboo.se>
|
|
Date: Sun, 18 Aug 2019 10:40:31 +0000
|
|
Subject: [PATCH] media: hantro: Enable H264 decoding on RK3328
|
|
|
|
RK3328 SoC has the same decoder IP block as RK3399,
|
|
lets enable H264 decoding on RK3328.
|
|
|
|
Signed-off-by: Jonas Karlman <jonas@kwiboo.se>
|
|
---
|
|
drivers/staging/media/hantro/rk3399_vpu_hw.c | 3 ++-
|
|
1 file changed, 2 insertions(+), 1 deletion(-)
|
|
|
|
diff --git a/drivers/staging/media/hantro/rk3399_vpu_hw.c b/drivers/staging/media/hantro/rk3399_vpu_hw.c
|
|
index 3e05cd2c870e..78f878ca01ff 100644
|
|
--- a/drivers/staging/media/hantro/rk3399_vpu_hw.c
|
|
+++ b/drivers/staging/media/hantro/rk3399_vpu_hw.c
|
|
@@ -232,7 +232,8 @@ const struct hantro_variant rk3328_vpu_variant = {
|
|
.dec_offset = 0x400,
|
|
.dec_fmts = rk3399_vpu_dec_fmts,
|
|
.num_dec_fmts = ARRAY_SIZE(rk3399_vpu_dec_fmts),
|
|
- .codec = HANTRO_MPEG2_DECODER | HANTRO_VP8_DECODER,
|
|
+ .codec = HANTRO_MPEG2_DECODER | HANTRO_VP8_DECODER |
|
|
+ HANTRO_H264_DECODER,
|
|
.codec_ops = rk3399_vpu_codec_ops,
|
|
.irqs = rk3328_irqs,
|
|
.num_irqs = ARRAY_SIZE(rk3328_irqs),
|
|
--
|
|
2.17.1
|
|
|