[PATCH 3/7] media: hantro: vp9: add support for legacy register set
Andrzej Pietrasiewicz
andrzej.p at collabora.com
Tue Nov 23 04:06:26 PST 2021
Hi Jernej,
W dniu 22.11.2021 o 19:46, Jernej Skrabec pisze:
> Some older G2 cores uses slightly different register set for HEVC and
> VP9. Since vast majority of registers and logic is the same, it doesn't
> make sense to introduce another drivers.
>
> Add legacy_regs quirk and implement only VP9 changes for now. HEVC
> changes will be introduced later, if needed.
>
> Signed-off-by: Jernej Skrabec <jernej.skrabec at gmail.com>
> ---
> drivers/staging/media/hantro/hantro.h | 2 +
> drivers/staging/media/hantro/hantro_g2_regs.h | 19 +++++
> .../staging/media/hantro/hantro_g2_vp9_dec.c | 74 ++++++++++++++-----
> 3 files changed, 78 insertions(+), 17 deletions(-)
>
> diff --git a/drivers/staging/media/hantro/hantro.h b/drivers/staging/media/hantro/hantro.h
> index d03824fa3222..83ed25d9657b 100644
> --- a/drivers/staging/media/hantro/hantro.h
> +++ b/drivers/staging/media/hantro/hantro.h
> @@ -74,6 +74,7 @@ struct hantro_irq {
> * @reg_names: array of register range names
> * @num_regs: number of register range names in the array
> * @double_buffer: core needs double buffering
> + * @legacy_regs: core uses legacy register set
> */
> struct hantro_variant {
> unsigned int enc_offset;
> @@ -96,6 +97,7 @@ struct hantro_variant {
> const char * const *reg_names;
> int num_regs;
> unsigned int double_buffer : 1;
> + unsigned int legacy_regs : 1;
> };
>
> /**
> diff --git a/drivers/staging/media/hantro/hantro_g2_regs.h b/drivers/staging/media/hantro/hantro_g2_regs.h
> index 15a391a4650e..d7c2ff05208e 100644
> --- a/drivers/staging/media/hantro/hantro_g2_regs.h
> +++ b/drivers/staging/media/hantro/hantro_g2_regs.h
> @@ -37,6 +37,13 @@
>
> #define g2_strm_swap G2_DEC_REG(2, 28, 0xf)
> #define g2_dirmv_swap G2_DEC_REG(2, 20, 0xf)
> +/* used on older variants */
> +#define g2_strm_swap_old G2_DEC_REG(2, 27, 0x1f)
> +#define g2_pic_swap G2_DEC_REG(2, 22, 0x1f)
> +#define g2_dirmv_swap_old G2_DEC_REG(2, 17, 0x1f)
> +#define g2_tab0_swap G2_DEC_REG(2, 12, 0x1f)
> +#define g2_tab1_swap G2_DEC_REG(2, 7, 0x1f)
> +#define g2_tab2_swap G2_DEC_REG(2, 2, 0x1f)\
Please rename g2_tab[0-2]_swap to g2_tab[0-2]_swap_old. Similar names
exist in newer variants (even if not used at the moment).
It is rather difficult to come up with a consistent rule with regard
to in what sequence to arrange these register definitions. It seems
to me that you use a hybrid approach: if the definitions being added
fall "out of order" then you annotate with a comment about older variants,
and if they are "in order" then you simply fold them into their place.
I don't have a very strong opinion, but maybe they all should be
just "in bitfield order" and without comments?
>
> #define g2_mode G2_DEC_REG(3, 27, 0x1f)
> #define g2_compress_swap G2_DEC_REG(3, 20, 0xf)
> @@ -45,6 +52,8 @@
> #define g2_out_dis G2_DEC_REG(3, 15, 0x1)
> #define g2_out_filtering_dis G2_DEC_REG(3, 14, 0x1)
> #define g2_write_mvs_e G2_DEC_REG(3, 12, 0x1)
> +#define g2_tab3_swap G2_DEC_REG(3, 7, 0x1f)
g2_tab3_swap_old
With all the above addressed you can add my
Reviewied-by: Andrzej Pietrasiewicz <andrzej.p at collabora.com>
> +#define g2_rscan_swap G2_DEC_REG(3, 2, 0x1f)
>
> #define g2_pic_width_in_cbs G2_DEC_REG(4, 19, 0x1fff)
> #define g2_pic_height_in_cbs G2_DEC_REG(4, 6, 0x1fff)
> @@ -58,6 +67,7 @@
> #define g2_tempor_mvp_e G2_DEC_REG(5, 11, 0x1)
> #define g2_max_cu_qpd_depth G2_DEC_REG(5, 5, 0x3f)
> #define g2_cu_qpd_e G2_DEC_REG(5, 4, 0x1)
> +#define g2_pix_shift G2_DEC_REG(5, 0, 0xf)
>
> #define g2_stream_len G2_DEC_REG(6, 0, 0xffffffff)
>
> @@ -80,6 +90,8 @@
>
> #define g2_const_intra_e G2_DEC_REG(8, 31, 0x1)
> #define g2_filt_ctrl_pres G2_DEC_REG(8, 30, 0x1)
> +#define g2_bit_depth_y G2_DEC_REG(8, 21, 0xf)
> +#define g2_bit_depth_c G2_DEC_REG(8, 17, 0xf)
> #define g2_idr_pic_e G2_DEC_REG(8, 16, 0x1)
> #define g2_bit_depth_pcm_y G2_DEC_REG(8, 12, 0xf)
> #define g2_bit_depth_pcm_c G2_DEC_REG(8, 8, 0xf)
> @@ -87,6 +99,9 @@
> #define g2_bit_depth_c_minus8 G2_DEC_REG(8, 4, 0x3)
> #define g2_output_8_bits G2_DEC_REG(8, 3, 0x1)
> #define g2_output_format G2_DEC_REG(8, 0, 0x7)
> +/* used on older variants */
> +#define g2_rs_out_bit_depth G2_DEC_REG(8, 4, 0xf)
> +#define g2_pp_pix_shift G2_DEC_REG(8, 0, 0xf)
>
> #define g2_refidx1_active G2_DEC_REG(9, 19, 0x1f)
> #define g2_refidx0_active G2_DEC_REG(9, 14, 0x1f)
> @@ -98,6 +113,10 @@
> #define g2_num_tile_rows G2_DEC_REG(10, 14, 0x1f)
> #define g2_tile_e G2_DEC_REG(10, 1, 0x1)
> #define g2_entropy_sync_e G2_DEC_REG(10, 0, 0x1)
> +/* used on older variants */
> +#define g2_init_qp_old G2_DEC_REG(10, 25, 0x3f)
> +#define g2_num_tile_cols_old G2_DEC_REG(10, 20, 0x1f)
> +#define g2_num_tile_rows_old G2_DEC_REG(10, 15, 0x1f)
>
> #define vp9_transform_mode G2_DEC_REG(11, 27, 0x7)
> #define vp9_filt_sharpness G2_DEC_REG(11, 21, 0x7)
> diff --git a/drivers/staging/media/hantro/hantro_g2_vp9_dec.c b/drivers/staging/media/hantro/hantro_g2_vp9_dec.c
> index d4fc649a4da1..5aac32700cd0 100644
> --- a/drivers/staging/media/hantro/hantro_g2_vp9_dec.c
> +++ b/drivers/staging/media/hantro/hantro_g2_vp9_dec.c
> @@ -150,7 +150,8 @@ static void config_output(struct hantro_ctx *ctx,
> dma_addr_t luma_addr, chroma_addr, mv_addr;
>
> hantro_reg_write(ctx->dev, &g2_out_dis, 0);
> - hantro_reg_write(ctx->dev, &g2_output_format, 0);
> + if (!ctx->dev->variant->legacy_regs)
> + hantro_reg_write(ctx->dev, &g2_output_format, 0);
>
> luma_addr = hantro_get_dec_buf_addr(ctx, &dst->base.vb.vb2_buf);
> hantro_write_addr(ctx->dev, G2_OUT_LUMA_ADDR, luma_addr);
> @@ -327,6 +328,7 @@ config_tiles(struct hantro_ctx *ctx,
> struct hantro_aux_buf *tile_edge = &vp9_ctx->tile_edge;
> dma_addr_t addr;
> unsigned short *tile_mem;
> + unsigned int rows, cols;
>
> addr = misc->dma + vp9_ctx->tile_info_offset;
> hantro_write_addr(ctx->dev, G2_TILE_SIZES_ADDR, addr);
> @@ -344,17 +346,24 @@ config_tiles(struct hantro_ctx *ctx,
>
> fill_tile_info(ctx, tile_r, tile_c, sbs_r, sbs_c, tile_mem);
>
> + cols = tile_c;
> + rows = tile_r;
> hantro_reg_write(ctx->dev, &g2_tile_e, 1);
> - hantro_reg_write(ctx->dev, &g2_num_tile_cols, tile_c);
> - hantro_reg_write(ctx->dev, &g2_num_tile_rows, tile_r);
> -
> } else {
> tile_mem[0] = hantro_vp9_num_sbs(dst->vp9.width);
> tile_mem[1] = hantro_vp9_num_sbs(dst->vp9.height);
>
> + cols = 1;
> + rows = 1;
> hantro_reg_write(ctx->dev, &g2_tile_e, 0);
> - hantro_reg_write(ctx->dev, &g2_num_tile_cols, 1);
> - hantro_reg_write(ctx->dev, &g2_num_tile_rows, 1);
> + }
> +
> + if (ctx->dev->variant->legacy_regs) {
> + hantro_reg_write(ctx->dev, &g2_num_tile_cols_old, cols);
> + hantro_reg_write(ctx->dev, &g2_num_tile_rows_old, rows);
> + } else {
> + hantro_reg_write(ctx->dev, &g2_num_tile_cols, cols);
> + hantro_reg_write(ctx->dev, &g2_num_tile_rows, rows);
> }
>
> /* provide aux buffers even if no tiles are used */
> @@ -505,8 +514,22 @@ static void config_picture_dimensions(struct hantro_ctx *ctx, struct hantro_deco
> static void
> config_bit_depth(struct hantro_ctx *ctx, const struct v4l2_ctrl_vp9_frame *dec_params)
> {
> - hantro_reg_write(ctx->dev, &g2_bit_depth_y_minus8, dec_params->bit_depth - 8);
> - hantro_reg_write(ctx->dev, &g2_bit_depth_c_minus8, dec_params->bit_depth - 8);
> + if (ctx->dev->variant->legacy_regs) {
> + u8 pp_shift = 0;
> +
> + hantro_reg_write(ctx->dev, &g2_bit_depth_y, dec_params->bit_depth);
> + hantro_reg_write(ctx->dev, &g2_bit_depth_c, dec_params->bit_depth);
> + hantro_reg_write(ctx->dev, &g2_rs_out_bit_depth, dec_params->bit_depth);
> +
> + if (dec_params->bit_depth > 8)
> + pp_shift = 16 - dec_params->bit_depth;
> +
> + hantro_reg_write(ctx->dev, &g2_pp_pix_shift, pp_shift);
> + hantro_reg_write(ctx->dev, &g2_pix_shift, 0);
> + } else {
> + hantro_reg_write(ctx->dev, &g2_bit_depth_y_minus8, dec_params->bit_depth - 8);
> + hantro_reg_write(ctx->dev, &g2_bit_depth_c_minus8, dec_params->bit_depth - 8);
> + }
> }
>
> static inline bool is_lossless(const struct v4l2_vp9_quantization *quant)
> @@ -784,9 +807,13 @@ config_source(struct hantro_ctx *ctx, const struct v4l2_ctrl_vp9_frame *dec_para
> + dec_params->compressed_header_size;
>
> stream_base = vb2_dma_contig_plane_dma_addr(&vb2_src->vb2_buf, 0);
> - hantro_write_addr(ctx->dev, G2_STREAM_ADDR, stream_base);
>
> tmp_addr = stream_base + headres_size;
> + if (ctx->dev->variant->legacy_regs)
> + hantro_write_addr(ctx->dev, G2_STREAM_ADDR, (tmp_addr & ~0xf));
> + else
> + hantro_write_addr(ctx->dev, G2_STREAM_ADDR, stream_base);
> +
> start_bit = (tmp_addr & 0xf) * 8;
> hantro_reg_write(ctx->dev, &g2_start_bit, start_bit);
>
> @@ -794,10 +821,12 @@ config_source(struct hantro_ctx *ctx, const struct v4l2_ctrl_vp9_frame *dec_para
> src_len += start_bit / 8 - headres_size;
> hantro_reg_write(ctx->dev, &g2_stream_len, src_len);
>
> - tmp_addr &= ~0xf;
> - hantro_reg_write(ctx->dev, &g2_strm_start_offset, tmp_addr - stream_base);
> - src_buf_len = vb2_plane_size(&vb2_src->vb2_buf, 0);
> - hantro_reg_write(ctx->dev, &g2_strm_buffer_len, src_buf_len);
> + if (!ctx->dev->variant->legacy_regs) {
> + tmp_addr &= ~0xf;
> + hantro_reg_write(ctx->dev, &g2_strm_start_offset, tmp_addr - stream_base);
> + src_buf_len = vb2_plane_size(&vb2_src->vb2_buf, 0);
> + hantro_reg_write(ctx->dev, &g2_strm_buffer_len, src_buf_len);
> + }
> }
>
> static void
> @@ -837,13 +866,24 @@ config_registers(struct hantro_ctx *ctx, const struct v4l2_ctrl_vp9_frame *dec_p
>
> /* configure basic registers */
> hantro_reg_write(ctx->dev, &g2_mode, VP9_DEC_MODE);
> - hantro_reg_write(ctx->dev, &g2_strm_swap, 0xf);
> - hantro_reg_write(ctx->dev, &g2_dirmv_swap, 0xf);
> - hantro_reg_write(ctx->dev, &g2_compress_swap, 0xf);
> + if (!ctx->dev->variant->legacy_regs) {
> + hantro_reg_write(ctx->dev, &g2_strm_swap, 0xf);
> + hantro_reg_write(ctx->dev, &g2_dirmv_swap, 0xf);
> + hantro_reg_write(ctx->dev, &g2_compress_swap, 0xf);
> + hantro_reg_write(ctx->dev, &g2_ref_compress_bypass, 1);
> + } else {
> + hantro_reg_write(ctx->dev, &g2_strm_swap_old, 0x1f);
> + hantro_reg_write(ctx->dev, &g2_pic_swap, 0x10);
> + hantro_reg_write(ctx->dev, &g2_dirmv_swap_old, 0x10);
> + hantro_reg_write(ctx->dev, &g2_tab0_swap, 0x10);
> + hantro_reg_write(ctx->dev, &g2_tab1_swap, 0x10);
> + hantro_reg_write(ctx->dev, &g2_tab2_swap, 0x10);
> + hantro_reg_write(ctx->dev, &g2_tab3_swap, 0x10);
> + hantro_reg_write(ctx->dev, &g2_rscan_swap, 0x10);
> + }
> hantro_reg_write(ctx->dev, &g2_buswidth, BUS_WIDTH_128);
> hantro_reg_write(ctx->dev, &g2_max_burst, 16);
> hantro_reg_write(ctx->dev, &g2_apf_threshold, 8);
> - hantro_reg_write(ctx->dev, &g2_ref_compress_bypass, 1);
> hantro_reg_write(ctx->dev, &g2_clk_gate_e, 1);
> hantro_reg_write(ctx->dev, &g2_max_cb_size, 6);
> hantro_reg_write(ctx->dev, &g2_min_cb_size, 3);
>
More information about the linux-arm-kernel
mailing list