[PATCH 6/7] [media] vcodec: mediatek: Add Mediatek VP9 Video Decoder Driver

Tiffany Lin tiffany.lin at mediatek.com
Wed Apr 13 05:01:54 PDT 2016


Add VP9 decoder driver for MT8173.

Signed-off-by: Tiffany Lin <tiffany.lin at mediatek.com>
---
 drivers/media/platform/mtk-vcodec/Makefile         |    1 +
 .../media/platform/mtk-vcodec/vdec/vdec_vp9_if.c   | 1108 ++++++++++++++++++++
 drivers/media/platform/mtk-vcodec/vdec_drv_if.c    |    3 +
 3 files changed, 1112 insertions(+)
 create mode 100644 drivers/media/platform/mtk-vcodec/vdec/vdec_vp9_if.c

diff --git a/drivers/media/platform/mtk-vcodec/Makefile b/drivers/media/platform/mtk-vcodec/Makefile
index 7743c81..852d969 100644
--- a/drivers/media/platform/mtk-vcodec/Makefile
+++ b/drivers/media/platform/mtk-vcodec/Makefile
@@ -5,6 +5,7 @@ obj-$(CONFIG_VIDEO_MEDIATEK_VCODEC) += mtk-vcodec-dec.o \
 
 mtk-vcodec-dec-y := vdec/vdec_h264_if.o \
 		vdec/vdec_vp8_if.o \
+		vdec/vdec_vp9_if.o \
 		mtk_vcodec_dec_drv.o \
 		vdec_drv_if.o \
 		vdec_vpu_if.o \
diff --git a/drivers/media/platform/mtk-vcodec/vdec/vdec_vp9_if.c b/drivers/media/platform/mtk-vcodec/vdec/vdec_vp9_if.c
new file mode 100644
index 0000000..6d0fb68
--- /dev/null
+++ b/drivers/media/platform/mtk-vcodec/vdec/vdec_vp9_if.c
@@ -0,0 +1,1108 @@
+/*
+ * Copyright (c) 2016 MediaTek Inc.
+ * Author: Daniel Hsiao <daniel.hsiao at mediatek.com>
+ *             Kai-Sean Yang <kai-sean.yang at mediatek.com>
+ *		  Tiffany Lin <tiffany.lin at mediatek.com>
+ *
+ * This program is free software; you can redistribute it and/or
+ * modify
+ * it under the terms of the GNU General Public License version 2 as
+ * published by the Free Software Foundation.
+ *
+ * This program is distributed in the hope that it will be useful,
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ * GNU General Public License for more details.
+ */
+
+#include <linux/fs.h>
+#include <linux/slab.h>
+#include <linux/syscalls.h>
+#include <linux/delay.h>
+#include <linux/time.h>
+
+#include "mtk_vcodec_intr.h"
+#include "vdec_drv_base.h"
+#include "vdec_vpu_if.h"
+
+#define VP9_SUPER_FRAME_BS_SZ 64	/* bytes in vdec_vp9_vsi.sf_bs_buf */
+
+#define REFS_PER_FRAME 3	/* entries in vdec_vp9_vsi.frm_refs */
+#define REF_FRAMES_LOG2 3
+#define REF_FRAMES (1 << REF_FRAMES_LOG2)	/* entries in ref_frm_map */
+#define VP9_MAX_FRM_BUFF_NUM (9 + 0)	/* entries in vdec_vp9_vsi.frm_bufs */
+#define VP9_MAX_FRM_BUFF_NODE_NUM (9 + 9)	/* nodes in vdec_vp9_inst.dec_fb */
+
+
+struct vdec_vp9_frm_hdr {	/* host-side copy of per-frame header info */
+	unsigned int width;	/* copied from vsi->pic_w */
+	unsigned int height;	/* copied from vsi->pic_h */
+	unsigned char show_frame;	/* copied from vsi->show_frm */
+	unsigned char resolution_changed; /* set by vp9_realloc_work_buf() */
+};
+
+struct vdec_vp9_work_buf {	/* working buffers owned by the host driver */
+	unsigned int frmbuf_width;	/* copied from vsi->buf_w */
+	unsigned int frmbuf_height;	/* copied from vsi->buf_h */
+	struct mtk_vcodec_mem seg_id_buf;	/* unused in this patch */
+	struct mtk_vcodec_mem tile_buf;	/* unused in this patch */
+	struct mtk_vcodec_mem count_tbl_buf;	/* unused in this patch */
+	struct mtk_vcodec_mem prob_tbl_buf;	/* unused in this patch */
+	struct mtk_vcodec_mem mv_buf;	/* (re)allocated in vp9_realloc_work_buf() */
+	struct vdec_fb sf_ref_buf[VP9_MAX_FRM_BUFF_NUM-1]; /* see vp9_get_sf_ref_fb() */
+};
+
+struct vp9_input_ctx {	/* bitstream addresses; member of struct vdec_vp9_vsi */
+	unsigned long v_fifo_sa;	/* not accessed by host code in this patch */
+	unsigned long v_fifo_ea;	/* not accessed by host code in this patch */
+	unsigned long p_fifo_sa;	/* not accessed by host code in this patch */
+	unsigned long p_fifo_ea;	/* not accessed by host code in this patch */
+	unsigned long v_frm_sa;	/* base used when copying a sub-frame in decode */
+	unsigned long v_frm_ea;	/* not accessed by host code in this patch */
+	unsigned long p_frm_sa;	/* not accessed by host code in this patch */
+	unsigned long p_frm_end;	/* not accessed by host code in this patch */
+	unsigned int frm_sz;	/* not accessed by host code in this patch */
+	unsigned int uncompress_sz;	/* not accessed by host code in this patch */
+};
+
+struct vp9_dram_buf {	/* buffer descriptor stored inside the shared vsi */
+	unsigned long va;	/* filled from mtk_vcodec_mem.va */
+	unsigned long pa;	/* filled from mtk_vcodec_mem.dma_addr */
+	unsigned int sz;	/* filled from mtk_vcodec_mem.size */
+	unsigned int vpua;	/* never written by host code in this patch */
+};
+
+struct vp9_fb_info {	/* per-frame-buffer record; member of vp9_ref_cnt_buf */
+	struct vdec_fb *fb;	/* host frame buffer, assigned in vdec_vp9_decode() */
+	struct vp9_dram_buf y_buf;	/* not accessed by host code in this patch */
+	struct vp9_dram_buf c_buf;	/* not accessed by host code in this patch */
+	struct vp9_dram_buf ufo_len_y;	/* not accessed by host code in this patch */
+	struct vp9_dram_buf ufo_len_c;	/* not accessed by host code in this patch */
+	unsigned int y_width;
+	unsigned int y_height;
+	unsigned int y_crop_width;
+	unsigned int y_crop_height;
+
+	unsigned int c_width;
+	unsigned int c_height;
+	unsigned int c_crop_width;
+	unsigned int c_crop_height;
+
+	unsigned int frm_num;	/* not accessed by host code in this patch */
+};
+
+struct vp9_ref_cnt_buf {	/* element type of vdec_vp9_vsi.frm_bufs[] */
+	struct vp9_fb_info buf;
+	unsigned int ref_cnt;	/* changed by vp9_ref_cnt_fb()/vp9_swap_frm_bufs() */
+};
+
+struct vp9_scale_factors {	/* member of vp9_ref_buf; host code never reads it */
+	int x_scale_fp;
+	int y_scale_fp;
+	int x_step_q4;
+	int y_step_q4;
+	unsigned int ref_scaling_en;
+};
+
+struct vp9_ref_buf {	/* element type of vdec_vp9_vsi.frm_refs[] */
+	struct vp9_fb_info *buf; /* host re-points this at vsi->frm_bufs[idx].buf */
+	struct vp9_scale_factors scale_factors;
+	unsigned int idx;	/* index into vsi->frm_bufs[] */
+};
+
+struct vp9_sf_ref_fb {	/* element type of vdec_vp9_vsi.sf_ref_fb[] */
+	struct vdec_fb fb;	/* copy of the matching work_buf.sf_ref_buf[] entry */
+	int used;	/* 0: slot may be handed out by vp9_get_sf_ref_fb() */
+	int idx;	/* slot index, written by vp9_get_sf_ref_fb() */
+};
+
+
+/*
+ * struct vdec_vp9_vsi - shared buffer between host and VPU driver
+ *
+ * The host obtains the pointer from inst->vpu.vsi after vpu_dec_init().
+ * Fields without a comment below are not accessed by the host code in
+ * this patch.
+ * NOTE(review): the layout presumably has to match the VPU firmware's
+ * view of this structure - confirm before reordering or resizing fields.
+ */
+struct vdec_vp9_vsi {
+	unsigned char sf_bs_buf[VP9_SUPER_FRAME_BS_SZ]; /* tail of input bitstream */
+	struct vp9_sf_ref_fb sf_ref_fb[VP9_MAX_FRM_BUFF_NUM-1];
+	int sf_next_ref_fb_idx;	/* result of vp9_get_sf_ref_fb(); may be -1 */
+	unsigned int sf_frm_cnt;	/* > 0 selects the sub-frame code paths */
+	unsigned int sf_frm_offset[VP9_MAX_FRM_BUFF_NUM-1]; /* memcpy source offset */
+	unsigned int sf_frm_sz[VP9_MAX_FRM_BUFF_NUM-1];	/* memcpy length */
+	unsigned int sf_frm_idx;	/* compared against sf_frm_cnt */
+	unsigned int sf_init;	/* 0: host copies bitstream tail to sf_bs_buf */
+	struct vdec_fb fb;	/* copy of the caller's frame buffer */
+	struct mtk_vcodec_mem bs;	/* copy of the caller's bitstream buffer */
+	struct vdec_fb cur_fb;
+	unsigned int pic_w;	/* read into frm_hdr.width */
+	unsigned int pic_h;	/* read into frm_hdr.height */
+	unsigned int buf_w;	/* read into work_buf.frmbuf_width */
+	unsigned int buf_h;	/* read into work_buf.frmbuf_height */
+	unsigned int buf_sz_y_bs;	/* reported as pic->y_bs_sz */
+	unsigned int buf_sz_c_bs;	/* reported as pic->c_bs_sz */
+	unsigned int buf_len_sz_y;	/* reported as pic->y_len_sz */
+	unsigned int buf_len_sz_c;	/* reported as pic->c_len_sz */
+	unsigned int profile;	/* vp9_init_proc() rejects values > 0 */
+	unsigned int show_frm;	/* read into frm_hdr.show_frame */
+	unsigned int show_exist; /* non-zero: vp9_check_proc() skips the IRQ wait */
+	unsigned int frm_to_show;	/* frm_bufs[] index used with show_exist */
+	unsigned int refresh_frm_flags;	/* bit n set: update ref_frm_map[n] */
+	unsigned int resolution_changed; /* triggers vp9_realloc_work_buf() */
+
+	struct vp9_input_ctx input_ctx;
+	struct vp9_ref_cnt_buf frm_bufs[VP9_MAX_FRM_BUFF_NUM];
+	int ref_frm_map[REF_FRAMES];	/* values index frm_bufs[] */
+	unsigned int new_fb_idx;	/* frm_bufs[] slot of the current frame */
+	unsigned int frm_num;	/* incremented by vp9_check_proc() */
+	struct vp9_dram_buf seg_id_buf;
+	struct vp9_dram_buf tile_buf;
+	struct vp9_dram_buf count_tbl_buf;
+	struct vp9_dram_buf prob_tbl_buf;
+	struct vp9_dram_buf mv_buf;	/* filled by vp9_setup_buf() */
+	struct vp9_ref_buf frm_refs[REFS_PER_FRAME];
+
+};
+
+struct vdec_vp9_inst {	/* per-decoder state; the handle given to callers */
+	struct vdec_vp9_work_buf work_buf;
+	struct vdec_vp9_frm_hdr frm_hdr;
+	struct vdec_fb_node dec_fb[VP9_MAX_FRM_BUFF_NODE_NUM]; /* list node pool */
+	struct list_head available_fb_node_list; /* nodes not on another list */
+	struct list_head fb_use_list;	/* filled by vp9_add_to_fb_use_list() */
+	struct list_head fb_free_list;	/* drained by get_free_fb() */
+	struct list_head fb_disp_list;	/* drained by get_disp_fb() */
+	struct vdec_fb *cur_fb;	/* destination buffer of the current frame */
+	unsigned int frm_cnt;	/* incremented once per successful decode call */
+	unsigned int total_frm_cnt; /* incremented once per processed frame */
+	void *ctx;	/* the struct mtk_vcodec_ctx passed to vdec_vp9_init() */
+	struct vdec_vpu_inst vpu;
+	struct vdec_vp9_vsi *vsi;	/* set from vpu.vsi in vdec_vp9_init() */
+	unsigned int show_reg;	/* unused in this patch */
+	struct file *log;	/* unused in this patch */
+	struct mtk_vcodec_mem mem; /* the allocation that holds this instance */
+};
+
+/*
+ * Copy the description of the motion-vector working buffer into the
+ * shared vsi structure.
+ *
+ * Returns 0 on success, or -EINVAL when the buffer has a zero CPU
+ * address, a zero DMA address or a zero size.
+ */
+static int vp9_setup_buf(struct vdec_vp9_inst *inst)
+{
+	struct vdec_vp9_vsi *vsi = inst->vpu.vsi;
+	struct mtk_vcodec_mem *src = &inst->work_buf.mv_buf;
+	struct vp9_dram_buf *dst = &vsi->mv_buf;
+
+	dst->va = (unsigned long)src->va;
+	dst->pa = (unsigned long)src->dma_addr;
+	dst->sz = (unsigned long)src->size;
+
+	if (!dst->va || !dst->pa || !dst->sz)
+		return -EINVAL;
+
+	mtk_vcodec_debug(inst, "VP9_MV_BUF_Addr: 0x%lX (0x%lX)",
+			 dst->va, dst->pa);
+	return 0;
+}
+
+/*
+ * Tell whether @fb points at one of the frame buffers embedded in
+ * vsi->sf_ref_fb[] (as opposed to a buffer supplied by the caller).
+ */
+static bool vp9_is_sf_ref_fb(struct vdec_vp9_inst *inst, struct vdec_fb *fb)
+{
+	struct vp9_sf_ref_fb *slot = inst->vsi->sf_ref_fb;
+	int n;
+
+	for (n = 0; n < VP9_MAX_FRM_BUFF_NUM - 1; n++, slot++)
+		if (&slot->fb == fb)
+			return true;
+
+	return false;
+}
+
+/*
+ * Look up the in-use frame buffer whose luma virtual address is @addr,
+ * return its list node to the pool of available nodes and hand the frame
+ * buffer back to the caller.
+ *
+ * Returns the matching frame buffer, or NULL when fb_use_list is empty or
+ * holds no buffer with that address.  (Previously an uninitialised
+ * pointer or the last, unrelated list entry was returned in those cases.)
+ */
+static struct vdec_fb *vp9_rm_from_fb_use_list(struct vdec_vp9_inst
+					*inst, void *addr)
+{
+	struct vdec_fb *fb;
+	struct vdec_fb_node *node;
+
+	list_for_each_entry(node, &inst->fb_use_list, list) {
+		fb = (struct vdec_fb *)node->fb;
+		if (fb->base_y.va == addr) {
+			/* Leaving the loop right away, so moving is safe. */
+			list_move_tail(&node->list,
+				       &inst->available_fb_node_list);
+			return fb;
+		}
+	}
+
+	return NULL;
+}
+
+/*
+ * Queue @fb on fb_free_list using a node taken from the available pool.
+ * A NULL @fb is ignored; running out of nodes is only logged.
+ *
+ * Always returns true.
+ */
+static bool vp9_add_to_fb_free_list(struct vdec_vp9_inst *inst,
+			     struct vdec_fb *fb)
+{
+	struct vdec_fb_node *spare;
+
+	if (!fb)
+		return true;
+
+	spare = list_first_entry_or_null(&inst->available_fb_node_list,
+					 struct vdec_fb_node, list);
+	if (!spare) {
+		mtk_vcodec_debug(inst, "No free fb node");
+		return true;
+	}
+
+	spare->fb = fb;
+	list_move_tail(&spare->list, &inst->fb_free_list);
+
+	return true;
+}
+
+/*
+ * Mark the vp9_sf_ref_fb slot that embeds @fb as no longer in use.
+ * @fb must be the fb member of a struct vp9_sf_ref_fb.
+ *
+ * Always returns true.
+ */
+static bool vp9_free_sf_ref_fb(struct vdec_vp9_inst *inst, struct vdec_fb *fb)
+{
+	container_of(fb, struct vp9_sf_ref_fb, fb)->used = 0;
+
+	return true;
+}
+
+/*
+ * Redirect the reference slot *@idx to frame buffer @new_idx.
+ *
+ * The reference count of the buffer previously named by *@idx is dropped
+ * (when that index is non-negative and the count is non-zero).  When the
+ * count reaches zero the buffer is released: caller-supplied buffers go
+ * from the use list to the free list, internal sub-frame buffers are
+ * marked unused.  Finally *@idx is updated and the new buffer's
+ * reference count is raised.
+ */
+static void vp9_ref_cnt_fb(struct vdec_vp9_inst *inst, int *idx,
+			   int new_idx)
+{
+	struct vdec_vp9_vsi *vsi = inst->vsi;
+	int old = *idx;
+
+	if (old >= 0 && vsi->frm_bufs[old].ref_cnt > 0) {
+		struct vp9_ref_cnt_buf *prev = &vsi->frm_bufs[old];
+
+		prev->ref_cnt--;
+
+		if (prev->ref_cnt == 0) {
+			struct vdec_fb *fb = prev->buf.fb;
+
+			if (vp9_is_sf_ref_fb(inst, fb)) {
+				vp9_free_sf_ref_fb(inst, fb);
+			} else {
+				fb = vp9_rm_from_fb_use_list(inst,
+							     fb->base_y.va);
+				vp9_add_to_fb_free_list(inst, fb);
+			}
+		}
+	}
+
+	*idx = new_idx;
+	vsi->frm_bufs[new_idx].ref_cnt++;
+}
+
+/*
+ * Free the luma and chroma memory of every allocated internal sub-frame
+ * reference buffer and mark the matching vsi slot as unused.
+ */
+static void vp9_free_all_sf_ref_fb(struct vdec_vp9_inst *inst)
+{
+	struct vdec_vp9_vsi *vsi = inst->vsi;
+	int slot;
+
+	for (slot = 0; slot < VP9_MAX_FRM_BUFF_NUM - 1; slot++) {
+		struct vdec_fb *buf = &inst->work_buf.sf_ref_buf[slot];
+
+		/* A slot without a luma address was never allocated. */
+		if (!buf->base_y.va)
+			continue;
+
+		mtk_vcodec_mem_free(inst->ctx, &buf->base_y);
+		mtk_vcodec_mem_free(inst->ctx, &buf->base_c);
+		vsi->sf_ref_fb[slot].used = 0;
+	}
+}
+
+/*
+ * Find or create an internal sub-frame reference buffer.
+ *
+ * An already allocated slot that is not marked used is returned as is.
+ * Otherwise the first never-allocated slot gets luma and chroma memory
+ * sized from the vsi (buf_sz_*_bs + buf_len_sz_*) and its addresses are
+ * mirrored into vsi->sf_ref_fb[].
+ *
+ * Returns the slot index, or -1 when every slot is allocated and in use,
+ * when the current picture size exceeds 4096x2304, or when an allocation
+ * fails.  On failure the slot is left completely unallocated, so a later
+ * call cannot pick up a buffer that has a luma plane but no chroma plane.
+ */
+static int vp9_get_sf_ref_fb(struct vdec_vp9_inst *inst)
+{
+	int i;
+	struct mtk_vcodec_mem *mem_y, *mem_c;
+	struct vdec_vp9_vsi *vsi = inst->vsi;
+	struct vdec_fb *fb_dst_ptr, *fb_src_ptr;
+
+	/* Prefer an existing buffer that is currently idle. */
+	for (i = 0; i < VP9_MAX_FRM_BUFF_NUM - 1; i++) {
+		if (inst->work_buf.sf_ref_buf[i].base_y.va &&
+		    vsi->sf_ref_fb[i].used == 0) {
+			return i;
+		}
+	}
+
+	/* Otherwise look for a slot that has no memory yet. */
+	for (i = 0; i < VP9_MAX_FRM_BUFF_NUM - 1; i++) {
+		if (inst->work_buf.sf_ref_buf[i].base_y.va == NULL)
+			break;
+	}
+
+	if (i == VP9_MAX_FRM_BUFF_NUM - 1) {
+		mtk_vcodec_err(inst, "List Full");
+		return -1;
+	}
+
+	if ((inst->frm_hdr.width > 4096) ||
+		(inst->frm_hdr.height > 2304)) {
+		mtk_vcodec_err(inst, "Invalid w/h %d/%d",
+			inst->frm_hdr.width,
+			inst->frm_hdr.height);
+		return -1;
+	}
+
+	fb_src_ptr = &inst->work_buf.sf_ref_buf[i];
+	fb_dst_ptr = &vsi->sf_ref_fb[i].fb;
+	mem_y = &fb_src_ptr->base_y;
+	mem_c = &fb_src_ptr->base_c;
+
+	mem_y->size = vsi->buf_sz_y_bs +
+		      vsi->buf_len_sz_y;
+
+	if (mtk_vcodec_mem_alloc(inst->ctx, mem_y)) {
+		mtk_vcodec_err(inst, "Cannot allocate sf_ref_buf y_buf");
+		return -1;
+	}
+
+	mtk_vcodec_debug(inst, "allocate sf_ref_buf y_buf = 0x%lx, %d",
+			mem_y->size,
+			inst->work_buf.frmbuf_width *
+			inst->work_buf.frmbuf_height);
+
+	mem_c->size = vsi->buf_sz_c_bs +
+		      vsi->buf_len_sz_c;
+
+	if (mtk_vcodec_mem_alloc(inst->ctx, mem_c)) {
+		mtk_vcodec_err(inst, "Cannot allocate sf_ref_buf c_buf");
+		/*
+		 * Give the luma plane back.  Leaving it allocated would
+		 * make the reuse loop above return this slot next time
+		 * although it has no chroma plane.  The address is cleared
+		 * explicitly in case mtk_vcodec_mem_free() leaves it set.
+		 */
+		mtk_vcodec_mem_free(inst->ctx, mem_y);
+		mem_y->va = NULL;
+		return -1;
+	}
+
+	mtk_vcodec_debug(inst, "allocate sf_ref_buf c_buf = 0x%lx, %d",
+			mem_c->size,
+			inst->work_buf.frmbuf_width *
+			inst->work_buf.frmbuf_height / 2);
+
+	/* Publish the buffer in the vsi only once both planes exist. */
+	fb_dst_ptr->base_y.va = mem_y->va;
+	fb_dst_ptr->base_y.dma_addr = mem_y->dma_addr;
+	fb_dst_ptr->base_y.size = mem_y->size;
+
+	fb_dst_ptr->base_c.va = mem_c->va;
+	fb_dst_ptr->base_c.dma_addr = mem_c->dma_addr;
+	fb_dst_ptr->base_c.size = mem_c->size;
+
+	vsi->sf_ref_fb[i].used = 0;
+	vsi->sf_ref_fb[i].idx = i;
+
+	return i;
+}
+
+/*
+ * Re-create the size-dependent working buffers after the vsi reported a
+ * new picture/buffer size.
+ *
+ * The sizes are taken from the vsi, the motion-vector buffer is freed and
+ * allocated again, all internal sub-frame buffers are dropped and one is
+ * requested anew, and the motion-vector buffer is published through
+ * vp9_setup_buf().  On success frm_hdr.resolution_changed is set.
+ *
+ * Returns true on success, false when the picture is larger than
+ * 4096x2304, the allocation fails or vp9_setup_buf() fails.
+ */
+bool vp9_realloc_work_buf(struct vdec_vp9_inst *inst)
+{
+	struct vdec_vp9_vsi *vsi = inst->vsi;
+	struct vdec_vp9_frm_hdr *hdr = &inst->frm_hdr;
+	struct vdec_vp9_work_buf *wb = &inst->work_buf;
+	struct mtk_vcodec_mem *mv = &wb->mv_buf;
+
+	hdr->width = vsi->pic_w;
+	hdr->height = vsi->pic_h;
+	wb->frmbuf_width = vsi->buf_w;
+	wb->frmbuf_height = vsi->buf_h;
+
+	mtk_vcodec_debug(inst, "BUF CHG(%d): w/h/sb_w/sb_h=%d/%d/%d/%d",
+			 hdr->resolution_changed, hdr->width, hdr->height,
+			 wb->frmbuf_width, wb->frmbuf_height);
+
+	if (hdr->width > 4096 || hdr->height > 2304) {
+		mtk_vcodec_err(inst, "Invalid w/h %d/%d",
+			       hdr->width, hdr->height);
+		return false;
+	}
+
+	/* Release the old motion-vector buffer before sizing the new one. */
+	if (mv->va)
+		mtk_vcodec_mem_free(inst->ctx, mv);
+
+	mv->size = ((wb->frmbuf_width / 64) *
+		    (wb->frmbuf_height / 64) + 2) * 36 * 16;
+
+	if (mtk_vcodec_mem_alloc(inst->ctx, mv)) {
+		mtk_vcodec_err(inst, "Cannot allocate mv_buf");
+		return false;
+	}
+
+	/* Publish the new addresses in the shared structure. */
+	vsi->mv_buf.va = (unsigned long)mv->va;
+	vsi->mv_buf.pa = (unsigned long)mv->dma_addr;
+	vsi->mv_buf.sz = (unsigned long)mv->size;
+
+	vp9_free_all_sf_ref_fb(inst);
+	vsi->sf_next_ref_fb_idx = vp9_get_sf_ref_fb(inst);
+
+	if (vp9_setup_buf(inst)) {
+		mtk_vcodec_err(inst, "Cannot vp9_setup_buf");
+		return false;
+	}
+
+	hdr->resolution_changed = true;
+
+	return true;
+}
+
+/*
+ * Queue @fb on fb_disp_list using a node from the available pool.
+ *
+ * Returns true when queued, false when @fb is NULL or no node is left.
+ */
+static bool vp9_add_to_fb_disp_list(struct vdec_vp9_inst *inst,
+			     struct vdec_fb *fb)
+{
+	struct vdec_fb_node *spare;
+
+	if (!fb)
+		return false;
+
+	spare = list_first_entry_or_null(&inst->available_fb_node_list,
+					 struct vdec_fb_node, list);
+	if (!spare) {
+		mtk_vcodec_debug(inst, "List Full");
+		return false;
+	}
+
+	spare->fb = fb;
+	list_move_tail(&spare->list, &inst->fb_disp_list);
+
+	mtk_vcodec_debug_leave(inst);
+
+	return true;
+}
+
+/*
+ * Bookkeeping after one frame has been processed.
+ *
+ *  - Every reference slot selected by vsi->refresh_frm_flags is pointed
+ *    at the new frame buffer (vsi->new_fb_idx).
+ *  - The reference taken for decoding the new buffer is dropped.
+ *  - If the buffer to show is not the current output buffer, its luma and
+ *    chroma planes are copied into the current output buffer, provided
+ *    both buffers exist and the destination is large enough.
+ *  - A caller-supplied output buffer is queued for display when the frame
+ *    is flagged as shown.
+ *  - A new buffer whose reference count dropped to zero is released.
+ *  - While more sub-frames are pending, the next internal sub-frame
+ *    buffer is selected.
+ *
+ * Missing (NULL) frame buffers are skipped instead of dereferenced, and
+ * the refresh loop never walks past the end of vsi->ref_frm_map[].
+ */
+static void vp9_swap_frm_bufs(struct vdec_vp9_inst *inst)
+{
+	struct vdec_vp9_vsi *vsi = inst->vsi;
+	struct vp9_fb_info *frm_to_show;
+	struct vdec_fb *new_fb;
+	unsigned int mask;
+	int ref_index = 0;
+
+	/* Unsigned mask plus index bound: the flags come from shared memory. */
+	for (mask = vsi->refresh_frm_flags;
+	     mask && ref_index < REF_FRAMES; mask >>= 1) {
+		if (mask & 1)
+			vp9_ref_cnt_fb(inst, &vsi->ref_frm_map[ref_index],
+				       vsi->new_fb_idx);
+		++ref_index;
+	}
+
+	frm_to_show = &vsi->frm_bufs[vsi->new_fb_idx].buf;
+	vsi->frm_bufs[vsi->new_fb_idx].ref_cnt--;
+
+	if (frm_to_show->fb != inst->cur_fb) {
+		struct vdec_fb *src = frm_to_show->fb;
+		struct vdec_fb *dst = inst->cur_fb;
+
+		if (!src || !dst) {
+			mtk_vcodec_debug(inst,
+				"skip copy, src fb=%p dst fb=%p", src, dst);
+		} else if (dst->base_y.size >= src->base_y.size) {
+			memcpy((void *)dst->base_y.va,
+				(void *)src->base_y.va,
+				inst->work_buf.frmbuf_width *
+				inst->work_buf.frmbuf_height);
+			memcpy((void *)dst->base_c.va,
+				(void *)src->base_c.va,
+				inst->work_buf.frmbuf_width *
+				inst->work_buf.frmbuf_height / 2);
+		} else {
+			mtk_vcodec_debug(inst,
+				"inst->cur_fb->base_y.size=%lx, frm_to_show->fb.base_y.size=%lx",
+				dst->base_y.size,
+				src->base_y.size);
+		}
+		if (!vp9_is_sf_ref_fb(inst, inst->cur_fb)) {
+			if (inst->frm_hdr.show_frame)
+				vp9_add_to_fb_disp_list(inst, inst->cur_fb);
+		}
+	} else {
+		if (!vp9_is_sf_ref_fb(inst, inst->cur_fb)) {
+			if (inst->frm_hdr.show_frame)
+				vp9_add_to_fb_disp_list(inst, frm_to_show->fb);
+		}
+	}
+
+	new_fb = vsi->frm_bufs[vsi->new_fb_idx].buf.fb;
+	/* Nothing to release when no frame buffer is attached. */
+	if (new_fb && vsi->frm_bufs[vsi->new_fb_idx].ref_cnt == 0) {
+		if (!vp9_is_sf_ref_fb(inst, new_fb)) {
+			struct vdec_fb *fb;
+
+			fb = vp9_rm_from_fb_use_list(inst, new_fb->base_y.va);
+
+			vp9_add_to_fb_free_list(inst, fb);
+		} else
+			vp9_free_sf_ref_fb(inst, new_fb);
+	}
+
+	if (vsi->sf_frm_cnt > 0 && vsi->sf_frm_idx != vsi->sf_frm_cnt - 1)
+		vsi->sf_next_ref_fb_idx = vp9_get_sf_ref_fb(inst);
+}
+
+/*
+ * Wait for the decode interrupt and inspect the recorded IRQ status.
+ *
+ * Returns true when bit 0x10000 is set in ctx->irq_status after the wait,
+ * false otherwise.  The return value of the wait itself is not examined.
+ */
+static bool vp9_wait_dec_end(struct vdec_vp9_inst *inst)
+{
+	struct mtk_vcodec_ctx *ctx = inst->ctx;
+	unsigned int status;
+
+	mtk_vcodec_wait_for_done_ctx(inst->ctx, MTK_INST_IRQ_RECEIVED,
+				     WAIT_INTR_TIMEOUT_MS);
+
+	status = ctx->irq_status;
+	mtk_vcodec_debug(inst, "isr return %x", status);
+
+	return (status & 0x10000) != 0;
+}
+
+/*
+ * Allocate a decoder instance.
+ *
+ * Room for two instances is requested: the second half is used by
+ * vdec_vp9_decode() as a backup copy of the first.  The descriptor of the
+ * allocation is stored inside the instance (inst->mem) so that
+ * vp9_free_handle() can release it later.
+ *
+ * The memory is cleared before use because other functions test buffer
+ * addresses inside the instance (work_buf.mv_buf.va,
+ * work_buf.sf_ref_buf[].base_y.va) against NULL before they are first
+ * assigned.
+ *
+ * Returns the new instance, or NULL when the allocation fails.
+ */
+struct vdec_vp9_inst *vp9_alloc_inst(void *ctx)
+{
+	int result;
+	struct mtk_vcodec_mem mem;
+	struct vdec_vp9_inst *inst;
+
+	/* Do not pass stack garbage in the unused descriptor fields. */
+	memset(&mem, 0, sizeof(mem));
+	mem.size = sizeof(struct vdec_vp9_inst) * 2;
+	result = mtk_vcodec_mem_alloc(ctx, &mem);
+	if (result)
+		return NULL;
+
+	inst = mem.va;
+	memset(inst, 0, sizeof(*inst) * 2);
+	inst->mem = mem;
+
+	return inst;
+}
+
+/*
+ * Release the memory that holds @inst, if any.
+ */
+void vp9_free_handle(struct vdec_vp9_inst *inst)
+{
+	/* Work on a copy: the descriptor lives inside the memory it names. */
+	struct mtk_vcodec_mem mem = inst->mem;
+
+	if (!mem.va)
+		return;
+
+	mtk_vcodec_mem_free(inst->ctx, &mem);
+}
+
+/*
+ * Report the stream dimensions found in the vsi through @pic_info, cache
+ * them in the instance and check them against the decoder limits.
+ *
+ * Returns false when the picture or the frame buffer exceeds 4096x2304 or
+ * when the profile is greater than 0, true otherwise.  @pic_info and the
+ * cached sizes are written in either case.
+ */
+bool vp9_init_proc(struct vdec_vp9_inst *inst,
+		   struct vdec_pic_info *pic_info)
+{
+	struct vdec_vp9_vsi *vsi = inst->vsi;
+	struct vdec_vp9_frm_hdr *hdr = &inst->frm_hdr;
+	struct vdec_vp9_work_buf *wb = &inst->work_buf;
+
+	pic_info->pic_w = vsi->pic_w;
+	pic_info->pic_h = vsi->pic_h;
+	pic_info->buf_w = vsi->buf_w;
+	pic_info->buf_h = vsi->buf_h;
+
+	mtk_vcodec_debug(inst,
+			"(PicW,PicH,BufW,BufH) = (%d,%d,%d,%d) profile=%d",
+			pic_info->pic_w, pic_info->pic_h,
+			pic_info->buf_w, pic_info->buf_h, vsi->profile);
+
+	hdr->width = vsi->pic_w;
+	hdr->height = vsi->pic_h;
+	wb->frmbuf_width = vsi->buf_w;
+	wb->frmbuf_height = vsi->buf_h;
+
+	/* Hardware limits: picture size, profile, frame buffer size. */
+	if (hdr->width > 4096 || hdr->height > 2304) {
+		mtk_vcodec_err(inst, "Invalid w/h %d/%d",
+			       hdr->width, hdr->height);
+		return false;
+	}
+
+	if (vsi->profile > 0) {
+		mtk_vcodec_err(inst, "vp9_dec DO NOT support profile(%d) > 0",
+			       vsi->profile);
+		return false;
+	}
+
+	if (wb->frmbuf_width > 4096 || wb->frmbuf_height > 2304) {
+		mtk_vcodec_err(inst, "vp9_dec DO NOT support (W,H) = (%d,%d)",
+			       wb->frmbuf_width, wb->frmbuf_height);
+		return false;
+	}
+
+	return true;
+}
+
+/*
+ * Finish processing of the current frame.
+ *
+ * When the vsi flags show_exist, only the buffer bookkeeping is done.
+ * Otherwise the function waits for the decode interrupt, calls
+ * vpu_dec_end() and then does the bookkeeping.  vsi->frm_num is
+ * incremented on success.
+ *
+ * Returns true on success, false when the wait does not report
+ * completion or vpu_dec_end() fails.
+ */
+bool vp9_check_proc(struct vdec_vp9_inst *inst)
+{
+	struct vdec_vp9_vsi *vsi = inst->vsi;
+
+	mtk_vcodec_debug_enter(inst);
+
+	if (vsi->show_exist) {
+		vp9_swap_frm_bufs(inst);
+		mtk_vcodec_debug(inst, "Decode Ok @%d (show_exist)",
+				 vsi->frm_num);
+		vsi->frm_num++;
+		return true;
+	}
+
+	if (!vp9_wait_dec_end(inst)) {
+		mtk_vcodec_err(inst, "Decode NG, Decode Timeout @[%d]",
+			       vsi->frm_num);
+		return false;
+	}
+
+	if (vpu_dec_end(&inst->vpu)) {
+		mtk_vcodec_err(inst, "vp9_dec_vpu_end failed");
+		return false;
+	}
+
+	vp9_swap_frm_bufs(inst);
+	mtk_vcodec_debug(inst, "Decode Ok @%d (%d/%d)", vsi->frm_num,
+			 inst->frm_hdr.width, inst->frm_hdr.height);
+	vsi->frm_num++;
+
+	mtk_vcodec_debug_leave(inst);
+
+	return true;
+}
+
+/*
+ * Returns true when the vsi reports no sub-frames (sf_frm_cnt is 0) or
+ * when sf_frm_idx has reached sf_frm_cnt; false otherwise.
+ */
+bool vp9_is_last_sub_frm(struct vdec_vp9_inst *inst)
+{
+	struct vdec_vp9_vsi *vsi = inst->vsi;
+
+	return !vsi->sf_frm_cnt || vsi->sf_frm_idx == vsi->sf_frm_cnt;
+}
+
+/*
+ * Take the oldest entry off fb_disp_list, flag its frame buffer with
+ * FB_ST_DISPLAY and return the list node to the available pool.
+ *
+ * Returns the frame buffer, or NULL when the list is empty.
+ */
+struct vdec_fb *vp9_rm_from_fb_disp_list(struct vdec_vp9_inst
+		*inst)
+{
+	struct vdec_fb_node *node;
+	struct vdec_fb *fb;
+
+	node = list_first_entry_or_null(&inst->fb_disp_list,
+					struct vdec_fb_node, list);
+	if (!node) {
+		mtk_vcodec_debug(inst, "[FB] there is no disp fb");
+		return NULL;
+	}
+
+	fb = (struct vdec_fb *)node->fb;
+	fb->status |= FB_ST_DISPLAY;
+	list_move_tail(&node->list, &inst->available_fb_node_list);
+	mtk_vcodec_debug(inst, "[FB] get disp fb %p st=%d",
+			 node->fb, fb->status);
+
+	return fb;
+}
+
+/*
+ * Queue @fb on fb_use_list using a node from the available pool.
+ *
+ * Returns true when queued, false when @fb is NULL or no node is left.
+ */
+bool vp9_add_to_fb_use_list(struct vdec_vp9_inst *inst,
+			    struct vdec_fb *fb)
+{
+	struct vdec_fb_node *spare;
+
+	if (!fb)
+		return false;
+
+	spare = list_first_entry_or_null(&inst->available_fb_node_list,
+					 struct vdec_fb_node, list);
+	if (!spare) {
+		mtk_vcodec_debug(inst, "No free fb node");
+		return false;
+	}
+
+	spare->fb = fb;
+	list_move_tail(&spare->list, &inst->fb_use_list);
+
+	mtk_vcodec_debug_leave(inst);
+
+	return true;
+}
+
+/*
+ * Take the oldest entry off fb_free_list, flag its frame buffer with
+ * FB_ST_FREE and return the list node to the available pool.
+ *
+ * Returns the frame buffer, or NULL when the list is empty.
+ */
+struct vdec_fb *vp9_rm_from_fb_free_list(struct vdec_vp9_inst
+		*inst)
+{
+	struct vdec_fb *fb = NULL;
+	struct vdec_fb_node *node =
+		list_first_entry_or_null(&inst->fb_free_list,
+					 struct vdec_fb_node, list);
+
+	if (!node) {
+		mtk_vcodec_debug(inst, "[FB] there is no free fb");
+	} else {
+		fb = (struct vdec_fb *)node->fb;
+		fb->status |= FB_ST_FREE;
+		list_move_tail(&node->list, &inst->available_fb_node_list);
+		mtk_vcodec_debug(inst, "[FB] get free fb %p st=%d",
+				 node->fb, fb->status);
+	}
+
+	mtk_vcodec_debug_leave(inst);
+
+	return fb;
+}
+
+/*
+ * Append every entry of fb_use_list, in order, to fb_free_list and leave
+ * fb_use_list empty.
+ *
+ * Always returns true.
+ */
+bool vp9_fb_use_list_to_fb_free_list(struct vdec_vp9_inst *inst)
+{
+	list_splice_tail_init(&inst->fb_use_list, &inst->fb_free_list);
+
+	mtk_vcodec_debug_leave(inst);
+	return true;
+}
+
+/*
+ * Reset the decoder: hand all in-use frame buffers to the free list,
+ * re-create the internal sub-frame buffer, reset the VPU and publish the
+ * motion-vector buffer again.  Failures of the last two steps are only
+ * logged.
+ */
+void vp9_reset(struct vdec_vp9_inst *inst)
+{
+	int next_sf_idx;
+
+	vp9_fb_use_list_to_fb_free_list(inst);
+	vp9_free_all_sf_ref_fb(inst);
+
+	next_sf_idx = vp9_get_sf_ref_fb(inst);
+	inst->vsi->sf_next_ref_fb_idx = next_sf_idx;
+
+	if (vpu_dec_reset(&inst->vpu) != 0)
+		mtk_vcodec_debug(inst, "vp9_dec_vpu_reset failed");
+
+	if (vp9_setup_buf(inst) != 0)
+		mtk_vcodec_debug(inst, "vp9_setup_buf failed");
+}
+
+/*
+ * Initialise the four frame-buffer lists and put every node of
+ * inst->dec_fb[] on the available list with no frame buffer attached.
+ */
+static void init_list(struct vdec_vp9_inst *inst)
+{
+	struct vdec_fb_node *node = inst->dec_fb;
+	struct vdec_fb_node *end = node + VP9_MAX_FRM_BUFF_NODE_NUM;
+
+	INIT_LIST_HEAD(&inst->available_fb_node_list);
+	INIT_LIST_HEAD(&inst->fb_use_list);
+	INIT_LIST_HEAD(&inst->fb_free_list);
+	INIT_LIST_HEAD(&inst->fb_disp_list);
+
+	for (; node < end; node++) {
+		INIT_LIST_HEAD(&node->list);
+		node->fb = NULL;
+		list_add_tail(&node->list, &inst->available_fb_node_list);
+	}
+}
+
+/*
+ * Fill @pic with the buffer sizes from the vsi and the picture/frame
+ * buffer dimensions cached in the instance.
+ */
+static void get_pic_info(struct vdec_vp9_inst *inst, struct vdec_pic_info *pic)
+{
+	struct vdec_vp9_vsi *vsi = inst->vsi;
+
+	pic->y_bs_sz = vsi->buf_sz_y_bs;
+	pic->c_bs_sz = vsi->buf_sz_c_bs;
+	pic->y_len_sz = vsi->buf_len_sz_y;
+	pic->c_len_sz = vsi->buf_len_sz_c;
+
+	pic->pic_w = inst->frm_hdr.width;
+	pic->pic_h = inst->frm_hdr.height;
+	pic->buf_w = inst->work_buf.frmbuf_width;
+	pic->buf_h = inst->work_buf.frmbuf_height;
+
+	mtk_vcodec_debug(inst, "pic(%d, %d), buf(%d, %d)",
+			 pic->pic_w, pic->pic_h, pic->buf_w, pic->buf_h);
+	mtk_vcodec_debug(inst, "Y(%d, %d), C(%d, %d)",
+			 pic->y_bs_sz, pic->y_len_sz,
+			 pic->c_bs_sz, pic->c_len_sz);
+}
+
+/*
+ * Store the next frame buffer that is ready for display in *@out_fb, or
+ * NULL when there is none.
+ */
+static void get_disp_fb(struct vdec_vp9_inst *inst, struct vdec_fb **out_fb)
+{
+	struct vdec_fb *fb;
+
+	mtk_vcodec_debug_enter(inst);
+
+	fb = vp9_rm_from_fb_disp_list(inst);
+	if (fb)
+		fb->status |= FB_ST_DISPLAY;
+
+	*out_fb = fb;
+}
+
+/*
+ * Store the next frame buffer the decoder no longer needs in *@out_fb,
+ * or NULL when there is none.  The buffer is flagged with FB_ST_FREE and
+ * its list node goes back to the available pool.
+ */
+static void get_free_fb(struct vdec_vp9_inst *inst, struct vdec_fb **out_fb)
+{
+	struct vdec_fb_node *node;
+
+	node = list_first_entry_or_null(&inst->fb_free_list,
+					struct vdec_fb_node, list);
+	if (!node) {
+		mtk_vcodec_debug(inst, "[FB] there is no free fb");
+		*out_fb = NULL;
+		return;
+	}
+
+	list_move_tail(&node->list, &inst->available_fb_node_list);
+	*out_fb = (struct vdec_fb *)node->fb;
+	(*out_fb)->status |= FB_ST_FREE;
+	mtk_vcodec_debug(inst, "[FB] get free fb %p st=%d",
+			 node->fb, (*out_fb)->status);
+}
+
+/*
+ * Tear down a decoder instance: shut down the VPU side, free the
+ * motion-vector buffer and the internal sub-frame buffers, then free the
+ * instance itself.
+ *
+ * Returns 0, or -EINVAL when vpu_dec_deinit() fails (the memory is freed
+ * in either case).
+ */
+static int vdec_vp9_deinit(unsigned long h_vdec)
+{
+	struct vdec_vp9_inst *inst = (struct vdec_vp9_inst *)h_vdec;
+	int ret = 0;
+
+	mtk_vcodec_debug_enter(inst);
+
+	if (vpu_dec_deinit(&inst->vpu)) {
+		mtk_vcodec_err(inst, "[E]vpu_dec_deinit");
+		ret = -EINVAL;
+	}
+
+	if (inst->work_buf.mv_buf.va)
+		mtk_vcodec_mem_free(inst->ctx, &inst->work_buf.mv_buf);
+
+	vp9_free_all_sf_ref_fb(inst);
+	vp9_free_handle(inst);
+
+	mtk_vcodec_debug_leave(inst);
+
+	return ret;
+}
+
+/*
+ * Create a decoder instance for @ctx and initialise the VPU side.
+ * On success the instance is returned through *@h_vdec as an opaque
+ * handle.
+ *
+ * Returns 0 on success, -ENOMEM when the instance cannot be allocated,
+ * or -EINVAL when vpu_dec_init() fails (the instance is freed again).
+ */
+static int vdec_vp9_init(struct mtk_vcodec_ctx *ctx, unsigned long *h_vdec)
+{
+	struct vdec_vp9_inst *inst = vp9_alloc_inst(ctx);
+
+	if (!inst)
+		return -ENOMEM;
+
+	inst->frm_cnt = 0;
+	inst->total_frm_cnt = 0;
+	inst->ctx = ctx;
+
+	inst->vpu.id = IPI_VDEC_VP9;
+	inst->vpu.dev = ctx->dev->vpu_plat_dev;
+	inst->vpu.ctx = ctx;
+	inst->vpu.handler = vpu_dec_ipi_handler;
+
+	if (vpu_dec_init(&inst->vpu)) {
+		mtk_vcodec_err(inst, "[E]vp9_dec_vpu_init - %d",
+						inst->vpu.inst_addr);
+		vp9_free_handle(inst);
+		return -EINVAL;
+	}
+
+	inst->vsi = (struct vdec_vp9_vsi *)inst->vpu.vsi;
+	init_list(inst);
+
+	*h_vdec = (unsigned long)inst;
+
+	return 0;
+}
+
+/*
+ * Decode one input bitstream buffer.
+ *
+ * @h_vdec:  instance handle from vdec_vp9_init()
+ * @bs:      input bitstream; NULL together with a NULL @fb requests a
+ *           reset (end of stream)
+ * @fb:      output frame buffer
+ * @res_chg: set to true when the stream changed resolution and the
+ *           caller has to provide new buffers; false otherwise
+ *
+ * The loop runs once per frame contained in @bs; it ends when
+ * vp9_is_last_sub_frm() reports that no further sub-frame is pending.
+ * Before every iteration the instance is copied into the second half of
+ * its allocation so that it can be restored when a resolution change is
+ * detected.
+ *
+ * Returns 0 on success, on reset and on resolution change.  Returns
+ * -EINVAL when @bs is NULL but @fb is not, when the VPU or the buffer
+ * handling fails, when no internal sub-frame buffer is available, and
+ * also on the show_exist path.  Whenever a negative value is returned,
+ * @fb is put on the free list.
+ */
+static int vdec_vp9_decode(unsigned long h_vdec, struct mtk_vcodec_mem *bs,
+		   struct vdec_fb *fb, bool *res_chg)
+{
+	int ret = 0;
+	struct vdec_vp9_inst *inst = (struct vdec_vp9_inst *)h_vdec;
+	struct vdec_vp9_frm_hdr *frm_hdr = &inst->frm_hdr;
+	struct vdec_vp9_vsi *vsi = inst->vsi;
+	unsigned int data[3];
+	int i;
+
+	mtk_vcodec_debug_enter(inst);
+
+	*res_chg = false;
+
+	if ((bs == NULL) && (fb == NULL)) {
+		mtk_vcodec_debug(inst, "[EOS]");
+		vp9_reset(inst);
+		return ret;
+	}
+
+	/* Everything below reads from the bitstream buffer. */
+	if (bs == NULL) {
+		mtk_vcodec_err(inst, "bs == NULL");
+		ret = -EINVAL;
+		goto DECODE_ERROR;
+	}
+
+	mtk_vcodec_debug(inst, "Input BS Size = %ld", bs->size);
+
+	/* Back up the instance for the resolution change path. */
+	memcpy((void *)inst + sizeof(*inst), (void *)inst,
+	       sizeof(*inst));
+
+	while (1) {
+		frm_hdr->resolution_changed = false;
+
+		/* The first three words of the bitstream go to the VPU. */
+		data[0] = *((unsigned int *)bs->va);
+		data[1] = *((unsigned int *)(bs->va + 4));
+		data[2] = *((unsigned int *)(bs->va + 8));
+
+		vsi->bs = *bs;
+
+		if (fb)
+			vsi->fb = *fb;
+
+		if (!vsi->sf_init) {
+			unsigned int sf_bs_sz;
+			unsigned int sf_bs_off;
+			unsigned char *sf_bs_src;
+			unsigned char *sf_bs_dst;
+
+			/*
+			 * Copy the last bytes of the bitstream, right
+			 * aligned, into sf_bs_buf.
+			 */
+			sf_bs_sz = bs->size > VP9_SUPER_FRAME_BS_SZ ?
+				VP9_SUPER_FRAME_BS_SZ : bs->size;
+			sf_bs_off = VP9_SUPER_FRAME_BS_SZ - sf_bs_sz;
+			sf_bs_src = bs->va + bs->size - sf_bs_sz;
+			sf_bs_dst = vsi->sf_bs_buf + sf_bs_off;
+			memcpy(sf_bs_dst, sf_bs_src, sf_bs_sz);
+		} else {
+			if ((vsi->sf_frm_cnt > 0) &&
+				(vsi->sf_frm_idx < vsi->sf_frm_cnt)) {
+				unsigned int idx = vsi->sf_frm_idx;
+
+				/* Move the next sub-frame to the front. */
+				memcpy((void *)vsi->input_ctx.v_frm_sa,
+					   (void *)(vsi->input_ctx.v_frm_sa +
+					   vsi->sf_frm_offset[idx]),
+					   vsi->sf_frm_sz[idx]);
+			}
+		}
+		ret = vpu_dec_start(&inst->vpu, data, 3);
+		if (ret) {
+			mtk_vcodec_err(inst, "vpu_dec_start failed");
+			ret = -EINVAL;
+			goto DECODE_ERROR;
+		}
+
+		if (vsi->resolution_changed) {
+			if (!vp9_realloc_work_buf(inst)) {
+				ret = -EINVAL;
+				goto DECODE_ERROR;
+			}
+		}
+
+		if ((vsi->sf_frm_cnt > 0) &&
+		    (vsi->sf_frm_idx < vsi->sf_frm_cnt)) {
+			int sf_idx = vsi->sf_next_ref_fb_idx;
+
+			/*
+			 * vp9_get_sf_ref_fb() reports failure as -1; do
+			 * not use that as an array index.
+			 */
+			if (sf_idx < 0 || sf_idx >= VP9_MAX_FRM_BUFF_NUM - 1) {
+				mtk_vcodec_err(inst, "no sf_ref_fb (%d)",
+					       sf_idx);
+				ret = -EINVAL;
+				goto DECODE_ERROR;
+			}
+			inst->cur_fb = &vsi->sf_ref_fb[sf_idx].fb;
+		} else {
+			inst->cur_fb = fb;
+		}
+
+		vsi->frm_bufs[vsi->new_fb_idx].buf.fb = inst->cur_fb;
+		if (!vp9_is_sf_ref_fb(inst, inst->cur_fb))
+			vp9_add_to_fb_use_list(inst, inst->cur_fb);
+
+		mtk_vcodec_debug(inst, "[#pic %d]", vsi->frm_num);
+
+		/* the same as VP9_SKIP_FRAME */
+		inst->frm_hdr.show_frame = vsi->show_frm;
+
+		if (vsi->show_exist)
+			mtk_vcodec_debug(inst,
+				"drv->new_fb_idx=%d, drv->frm_to_show=%d",
+				vsi->new_fb_idx, vsi->frm_to_show);
+
+		if (vsi->show_exist && (vsi->frm_to_show <
+					VP9_MAX_FRM_BUFF_NUM)) {
+			mtk_vcodec_debug(inst,
+				"Skip Decode drv->new_fb_idx=%d, drv->frm_to_show=%d",
+				vsi->new_fb_idx, vsi->frm_to_show);
+			vp9_ref_cnt_fb(inst, &vsi->new_fb_idx,
+							vsi->frm_to_show);
+			ret = -EINVAL;
+			goto DECODE_ERROR;
+		}
+
+		/*
+		 * The VPU assigns the buffer pointers in its own address
+		 * space; reassign them here from the indices.
+		 */
+		for (i = 0; i < REFS_PER_FRAME; i++) {
+			unsigned int idx = vsi->frm_refs[i].idx;
+
+			vsi->frm_refs[i].buf = &vsi->frm_bufs[idx].buf;
+		}
+
+		if (frm_hdr->resolution_changed) {
+			unsigned int width = inst->frm_hdr.width;
+			unsigned int height = inst->frm_hdr.height;
+			unsigned int frmbuf_width =
+				inst->work_buf.frmbuf_width;
+			unsigned int frmbuf_height =
+				inst->work_buf.frmbuf_height;
+			struct mtk_vcodec_mem tmp_buf =	inst->work_buf.mv_buf;
+			struct vp9_dram_buf tmp_buf2 = vsi->mv_buf;
+			struct vdec_fb tmp_buf3 =
+				inst->work_buf.sf_ref_buf[0];
+
+			/*
+			 * Restore the backup taken before this frame, but
+			 * keep the new sizes and the buffers that
+			 * vp9_realloc_work_buf() just allocated.
+			 */
+			memcpy((void *)inst, (void *)inst + sizeof(*inst),
+			       sizeof(*inst));
+
+			inst->frm_hdr.width = width;
+			inst->frm_hdr.height = height;
+			inst->work_buf.frmbuf_width = frmbuf_width;
+			inst->work_buf.frmbuf_height = frmbuf_height;
+			inst->work_buf.mv_buf = tmp_buf;
+			inst->vsi->mv_buf = tmp_buf2;
+			inst->work_buf.sf_ref_buf[0] = tmp_buf3;
+
+			*res_chg = true;
+			mtk_vcodec_debug(inst, "VDEC_ST_RESOLUTION_CHANGED");
+			vp9_add_to_fb_free_list(inst, fb);
+			ret = 0;
+			goto DECODE_ERROR;
+		}
+
+		if (vp9_check_proc(inst) != true) {
+			mtk_vcodec_err(inst, "vp9_check_proc");
+			ret = -EINVAL;
+			goto DECODE_ERROR;
+		}
+
+		inst->total_frm_cnt++;
+		if (vp9_is_last_sub_frm(inst))
+			break;
+
+		/* for resolution change backup */
+		memcpy((void *)inst + sizeof(*inst), (void *)inst,
+		       sizeof(*inst));
+	}
+	inst->frm_cnt++;
+
+DECODE_ERROR:
+	if (ret < 0)
+		vp9_add_to_fb_free_list(inst, fb);
+
+	mtk_vcodec_debug_leave(inst);
+
+	return ret;
+}
+
+/*
+ * Report the visible area: a rectangle at the origin with the cached
+ * picture width and height.
+ */
+static void get_crop_info(struct vdec_vp9_inst *inst, struct v4l2_crop *cr)
+{
+	const struct vdec_vp9_frm_hdr *hdr = &inst->frm_hdr;
+
+	cr->c.left = 0;
+	cr->c.top = 0;
+	cr->c.width = hdr->width;
+	cr->c.height = hdr->height;
+
+	mtk_vcodec_debug(inst, "get crop info l=%d, t=%d, w=%d, h=%d\n",
+			 cr->c.left, cr->c.top, cr->c.width, cr->c.height);
+}
+
+/*
+ * Query decoder state.  @out is interpreted according to @type:
+ * a struct vdec_fb ** for the two frame buffer queries, a
+ * struct vdec_pic_info * for GET_PARAM_PIC_INFO, an unsigned int * for
+ * GET_PARAM_DPB_SIZE and a struct v4l2_crop * for GET_PARAM_CROP_INFO.
+ *
+ * Returns 0 on success or -EINVAL for an unsupported @type.
+ */
+static int vdec_vp9_get_param(unsigned long h_vdec,
+			enum vdec_get_param_type type, void *out)
+{
+	struct vdec_vp9_inst *inst = (struct vdec_vp9_inst *)h_vdec;
+
+	switch (type) {
+	case GET_PARAM_DISP_FRAME_BUFFER:
+		get_disp_fb(inst, out);
+		return 0;
+	case GET_PARAM_FREE_FRAME_BUFFER:
+		get_free_fb(inst, out);
+		return 0;
+	case GET_PARAM_PIC_INFO:
+		get_pic_info(inst, out);
+		return 0;
+	case GET_PARAM_DPB_SIZE:
+		*((unsigned int *)out) = 9;
+		return 0;
+	case GET_PARAM_CROP_INFO:
+		get_crop_info(inst, out);
+		return 0;
+	default:
+		mtk_vcodec_err(inst, "not support type %d", type);
+		return -EINVAL;
+	}
+}
+
+static struct vdec_common_if vdec_vp9_if = {	/* positional: order matters */
+	vdec_vp9_init,	/* creates an instance */
+	vdec_vp9_decode,	/* decodes one bitstream buffer */
+	vdec_vp9_get_param,	/* queries decoder state */
+	vdec_vp9_deinit,	/* destroys an instance */
+};
+
+struct vdec_common_if *get_vp9_dec_comm_if(void)
+{
+	return &vdec_vp9_if;	/* the VP9 entry points defined in this file */
+}
diff --git a/drivers/media/platform/mtk-vcodec/vdec_drv_if.c b/drivers/media/platform/mtk-vcodec/vdec_drv_if.c
index 6e2f065..f5781d7 100644
--- a/drivers/media/platform/mtk-vcodec/vdec_drv_if.c
+++ b/drivers/media/platform/mtk-vcodec/vdec_drv_if.c
@@ -26,6 +26,7 @@
 
 struct vdec_common_if *get_h264_dec_comm_if(void);
 struct vdec_common_if *get_vp8_dec_comm_if(void);
+struct vdec_common_if *get_vp9_dec_comm_if(void);
 
 int vdec_if_init(struct mtk_vcodec_ctx *ctx, unsigned int fourcc)
 {
@@ -39,6 +40,8 @@ int vdec_if_init(struct mtk_vcodec_ctx *ctx, unsigned int fourcc)
 		ctx->dec_if = get_vp8_dec_comm_if();
 		break;
 	case V4L2_PIX_FMT_VP9:
+		ctx->dec_if = get_vp9_dec_comm_if();
+		break;
 	default:
 		return -EINVAL;
 	}
-- 
1.7.9.5




More information about the Linux-mediatek mailing list