// SPDX-License-Identifier: GPL-2.0 /* * Copyright (c) 2016 MediaTek Inc. * Author: PC Chen */ #include #include #include "../vdec_drv_if.h" #include "../mtk_vcodec_util.h" #include "../mtk_vcodec_dec.h" #include "../mtk_vcodec_intr.h" #include "../vdec_vpu_if.h" #include "../vdec_drv_base.h" #define NAL_NON_IDR_SLICE 0x01 #define NAL_IDR_SLICE 0x05 #define NAL_H264_PPS 0x08 #define NAL_TYPE(value) ((value) & 0x1F) #define BUF_PREDICTION_SZ (32 * 1024) #define MB_UNIT_LEN 16 /* motion vector size (bytes) for every macro block */ #define HW_MB_STORE_SZ 64 #define H264_MAX_FB_NUM 17 #define HDR_PARSING_BUF_SZ 1024 #define DEC_ERR_RET(ret) ((ret) >> 16) #define H264_ERR_NOT_VALID 3 /** * struct h264_fb - h264 decode frame buffer information * @vdec_fb_va : virtual address of struct vdec_fb * @y_fb_dma : dma address of Y frame buffer (luma) * @c_fb_dma : dma address of C frame buffer (chroma) * @poc : picture order count of frame buffer * @reserved : for 8 bytes alignment */ struct h264_fb { uint64_t vdec_fb_va; uint64_t y_fb_dma; uint64_t c_fb_dma; int32_t poc; uint32_t reserved; }; /** * struct h264_ring_fb_list - ring frame buffer list * @fb_list : frame buffer array * @read_idx : read index * @write_idx : write index * @count : buffer count in list * @reserved : for 8 bytes alignment */ struct h264_ring_fb_list { struct h264_fb fb_list[H264_MAX_FB_NUM]; unsigned int read_idx; unsigned int write_idx; unsigned int count; unsigned int reserved; }; /** * struct vdec_h264_dec_info - decode information * @dpb_sz : decoding picture buffer size * @resolution_changed : resolution change happen * @realloc_mv_buf : flag to notify driver to re-allocate mv buffer * @reserved : for 8 bytes alignment * @bs_dma : Input bit-stream buffer dma address * @y_fb_dma : Y frame buffer dma address * @c_fb_dma : C frame buffer dma address * @vdec_fb_va : VDEC frame buffer struct virtual address */ struct vdec_h264_dec_info { uint32_t dpb_sz; uint32_t resolution_changed; uint32_t realloc_mv_buf; uint32_t reserved; uint64_t bs_dma; uint64_t y_fb_dma; uint64_t c_fb_dma; uint64_t vdec_fb_va; }; /** * struct vdec_h264_vsi - shared memory for decode information exchange * between VPU and Host. * The memory is allocated by VPU then mapping to Host * in vpu_dec_init() and freed in vpu_dec_deinit() * by VPU. * AP-W/R : AP is writer/reader on this item * VPU-W/R: VPU is write/reader on this item * @hdr_buf : Header parsing buffer (AP-W, VPU-R) * @pred_buf_dma : HW working predication buffer dma address (AP-W, VPU-R) * @mv_buf_dma : HW working motion vector buffer dma address (AP-W, VPU-R) * @list_free : free frame buffer ring list (AP-W/R, VPU-W) * @list_disp : display frame buffer ring list (AP-R, VPU-W) * @dec : decode information (AP-R, VPU-W) * @pic : picture information (AP-R, VPU-W) * @crop : crop information (AP-R, VPU-W) */ struct vdec_h264_vsi { unsigned char hdr_buf[HDR_PARSING_BUF_SZ]; uint64_t pred_buf_dma; uint64_t mv_buf_dma[H264_MAX_FB_NUM]; struct h264_ring_fb_list list_free; struct h264_ring_fb_list list_disp; struct vdec_h264_dec_info dec; struct vdec_pic_info pic; struct v4l2_rect crop; }; /** * struct vdec_h264_inst - h264 decoder instance * @num_nalu : how many nalus be decoded * @ctx : point to mtk_vcodec_ctx * @pred_buf : HW working predication buffer * @mv_buf : HW working motion vector buffer * @vpu : VPU instance * @vsi : VPU shared information */ struct vdec_h264_inst { unsigned int num_nalu; struct mtk_vcodec_ctx *ctx; struct mtk_vcodec_mem pred_buf; struct mtk_vcodec_mem mv_buf[H264_MAX_FB_NUM]; struct vdec_vpu_inst vpu; struct vdec_h264_vsi *vsi; }; static unsigned int get_mv_buf_size(unsigned int width, unsigned int height) { return HW_MB_STORE_SZ * (width/MB_UNIT_LEN) * (height/MB_UNIT_LEN); } static int allocate_predication_buf(struct vdec_h264_inst *inst) { int err = 0; inst->pred_buf.size = BUF_PREDICTION_SZ; err = mtk_vcodec_mem_alloc(inst->ctx, &inst->pred_buf); if (err) { mtk_vcodec_err(inst, "failed to allocate ppl buf"); return err; } inst->vsi->pred_buf_dma = inst->pred_buf.dma_addr; return 0; } static void free_predication_buf(struct vdec_h264_inst *inst) { struct mtk_vcodec_mem *mem = NULL; mtk_vcodec_debug_enter(inst); inst->vsi->pred_buf_dma = 0; mem = &inst->pred_buf; if (mem->va) mtk_vcodec_mem_free(inst->ctx, mem); } static int alloc_mv_buf(struct vdec_h264_inst *inst, struct vdec_pic_info *pic) { int i; int err; struct mtk_vcodec_mem *mem = NULL; unsigned int buf_sz = get_mv_buf_size(pic->buf_w, pic->buf_h); for (i = 0; i < H264_MAX_FB_NUM; i++) { mem = &inst->mv_buf[i]; if (mem->va) mtk_vcodec_mem_free(inst->ctx, mem); mem->size = buf_sz; err = mtk_vcodec_mem_alloc(inst->ctx, mem); if (err) { mtk_vcodec_err(inst, "failed to allocate mv buf"); return err; } inst->vsi->mv_buf_dma[i] = mem->dma_addr; } return 0; } static void free_mv_buf(struct vdec_h264_inst *inst) { int i; struct mtk_vcodec_mem *mem = NULL; for (i = 0; i < H264_MAX_FB_NUM; i++) { inst->vsi->mv_buf_dma[i] = 0; mem = &inst->mv_buf[i]; if (mem->va) mtk_vcodec_mem_free(inst->ctx, mem); } } static int check_list_validity(struct vdec_h264_inst *inst, bool disp_list) { struct h264_ring_fb_list *list; list = disp_list ? &inst->vsi->list_disp : &inst->vsi->list_free; if (list->count > H264_MAX_FB_NUM || list->read_idx >= H264_MAX_FB_NUM || list->write_idx >= H264_MAX_FB_NUM) { mtk_vcodec_err(inst, "%s list err: cnt=%d r_idx=%d w_idx=%d", disp_list ? "disp" : "free", list->count, list->read_idx, list->write_idx); return -EINVAL; } return 0; } static void put_fb_to_free(struct vdec_h264_inst *inst, struct vdec_fb *fb) { struct h264_ring_fb_list *list; if (fb) { if (check_list_validity(inst, false)) return; list = &inst->vsi->list_free; if (list->count == H264_MAX_FB_NUM) { mtk_vcodec_err(inst, "[FB] put fb free_list full"); return; } mtk_vcodec_debug(inst, "[FB] put fb into free_list @(%p, %llx)", fb->base_y.va, (u64)fb->base_y.dma_addr); list->fb_list[list->write_idx].vdec_fb_va = (u64)(uintptr_t)fb; list->write_idx = (list->write_idx == H264_MAX_FB_NUM - 1) ? 0 : list->write_idx + 1; list->count++; } } static void get_pic_info(struct vdec_h264_inst *inst, struct vdec_pic_info *pic) { *pic = inst->vsi->pic; mtk_vcodec_debug(inst, "pic(%d, %d), buf(%d, %d)", pic->pic_w, pic->pic_h, pic->buf_w, pic->buf_h); mtk_vcodec_debug(inst, "fb size: Y(%d), C(%d)", pic->fb_sz[0], pic->fb_sz[1]); } static void get_crop_info(struct vdec_h264_inst *inst, struct v4l2_rect *cr) { cr->left = inst->vsi->crop.left; cr->top = inst->vsi->crop.top; cr->width = inst->vsi->crop.width; cr->height = inst->vsi->crop.height; mtk_vcodec_debug(inst, "l=%d, t=%d, w=%d, h=%d", cr->left, cr->top, cr->width, cr->height); } static void get_dpb_size(struct vdec_h264_inst *inst, unsigned int *dpb_sz) { *dpb_sz = inst->vsi->dec.dpb_sz; mtk_vcodec_debug(inst, "sz=%d", *dpb_sz); } static int vdec_h264_init(struct mtk_vcodec_ctx *ctx) { struct vdec_h264_inst *inst = NULL; int err; inst = kzalloc(sizeof(*inst), GFP_KERNEL); if (!inst) return -ENOMEM; inst->ctx = ctx; inst->vpu.id = IPI_VDEC_H264; inst->vpu.ctx = ctx; err = vpu_dec_init(&inst->vpu); if (err) { mtk_vcodec_err(inst, "vdec_h264 init err=%d", err); goto error_free_inst; } inst->vsi = (struct vdec_h264_vsi *)inst->vpu.vsi; err = allocate_predication_buf(inst); if (err) goto error_deinit; mtk_vcodec_debug(inst, "H264 Instance >> %p", inst); ctx->drv_handle = inst; return 0; error_deinit: vpu_dec_deinit(&inst->vpu); error_free_inst: kfree(inst); return err; } static void vdec_h264_deinit(void *h_vdec) { struct vdec_h264_inst *inst = (struct vdec_h264_inst *)h_vdec; mtk_vcodec_debug_enter(inst); vpu_dec_deinit(&inst->vpu); free_predication_buf(inst); free_mv_buf(inst); kfree(inst); } static int find_start_code(unsigned char *data, unsigned int data_sz) { if (data_sz > 3 && data[0] == 0 && data[1] == 0 && data[2] == 1) return 3; if (data_sz > 4 && data[0] == 0 && data[1] == 0 && data[2] == 0 && data[3] == 1) return 4; return -1; } static int vdec_h264_decode(void *h_vdec, struct mtk_vcodec_mem *bs, struct vdec_fb *fb, bool *res_chg) { struct vdec_h264_inst *inst = (struct vdec_h264_inst *)h_vdec; struct vdec_vpu_inst *vpu = &inst->vpu; int nal_start_idx = 0; int err = 0; unsigned int nal_start; unsigned int nal_type; unsigned char *buf; unsigned int buf_sz; unsigned int data[2]; uint64_t vdec_fb_va = (u64)(uintptr_t)fb; uint64_t y_fb_dma = fb ? (u64)fb->base_y.dma_addr : 0; uint64_t c_fb_dma = fb ? (u64)fb->base_c.dma_addr : 0; mtk_vcodec_debug(inst, "+ [%d] FB y_dma=%llx c_dma=%llx va=%p", ++inst->num_nalu, y_fb_dma, c_fb_dma, fb); /* bs NULL means flush decoder */ if (bs == NULL) return vpu_dec_reset(vpu); buf = (unsigned char *)bs->va; buf_sz = bs->size; nal_start_idx = find_start_code(buf, buf_sz); if (nal_start_idx < 0) { mtk_vcodec_err(inst, "invalid nal start code"); err = -EIO; goto err_free_fb_out; } nal_start = buf[nal_start_idx]; nal_type = NAL_TYPE(buf[nal_start_idx]); mtk_vcodec_debug(inst, "\n + NALU[%d] type %d +\n", inst->num_nalu, nal_type); if (nal_type == NAL_H264_PPS) { buf_sz -= nal_start_idx; if (buf_sz > HDR_PARSING_BUF_SZ) { err = -EILSEQ; goto err_free_fb_out; } memcpy(inst->vsi->hdr_buf, buf + nal_start_idx, buf_sz); } inst->vsi->dec.bs_dma = (uint64_t)bs->dma_addr; inst->vsi->dec.y_fb_dma = y_fb_dma; inst->vsi->dec.c_fb_dma = c_fb_dma; inst->vsi->dec.vdec_fb_va = vdec_fb_va; data[0] = buf_sz; data[1] = nal_start; err = vpu_dec_start(vpu, data, 2); if (err) { if (err > 0 && (DEC_ERR_RET(err) == H264_ERR_NOT_VALID)) { mtk_vcodec_err(inst, "- error bitstream - err = %d -", err); err = -EIO; } goto err_free_fb_out; } *res_chg = inst->vsi->dec.resolution_changed; if (*res_chg) { struct vdec_pic_info pic; mtk_vcodec_debug(inst, "- resolution changed -"); get_pic_info(inst, &pic); if (inst->vsi->dec.realloc_mv_buf) { err = alloc_mv_buf(inst, &pic); if (err) goto err_free_fb_out; } } if (nal_type == NAL_NON_IDR_SLICE || nal_type == NAL_IDR_SLICE) { /* wait decoder done interrupt */ err = mtk_vcodec_wait_for_done_ctx(inst->ctx, MTK_INST_IRQ_RECEIVED, WAIT_INTR_TIMEOUT_MS); if (err) goto err_free_fb_out; vpu_dec_end(vpu); } mtk_vcodec_debug(inst, "\n - NALU[%d] type=%d -\n", inst->num_nalu, nal_type); return 0; err_free_fb_out: put_fb_to_free(inst, fb); mtk_vcodec_err(inst, "\n - NALU[%d] err=%d -\n", inst->num_nalu, err); return err; } static void vdec_h264_get_fb(struct vdec_h264_inst *inst, struct h264_ring_fb_list *list, bool disp_list, struct vdec_fb **out_fb) { struct vdec_fb *fb; if (check_list_validity(inst, disp_list)) return; if (list->count == 0) { mtk_vcodec_debug(inst, "[FB] there is no %s fb", disp_list ? "disp" : "free"); *out_fb = NULL; return; } fb = (struct vdec_fb *) (uintptr_t)list->fb_list[list->read_idx].vdec_fb_va; fb->status |= (disp_list ? FB_ST_DISPLAY : FB_ST_FREE); *out_fb = fb; mtk_vcodec_debug(inst, "[FB] get %s fb st=%d poc=%d %llx", disp_list ? "disp" : "free", fb->status, list->fb_list[list->read_idx].poc, list->fb_list[list->read_idx].vdec_fb_va); list->read_idx = (list->read_idx == H264_MAX_FB_NUM - 1) ? 0 : list->read_idx + 1; list->count--; } static int vdec_h264_get_param(void *h_vdec, enum vdec_get_param_type type, void *out) { struct vdec_h264_inst *inst = (struct vdec_h264_inst *)h_vdec; switch (type) { case GET_PARAM_DISP_FRAME_BUFFER: vdec_h264_get_fb(inst, &inst->vsi->list_disp, true, out); break; case GET_PARAM_FREE_FRAME_BUFFER: vdec_h264_get_fb(inst, &inst->vsi->list_free, false, out); break; case GET_PARAM_PIC_INFO: get_pic_info(inst, out); break; case GET_PARAM_DPB_SIZE: get_dpb_size(inst, out); break; case GET_PARAM_CROP_INFO: get_crop_info(inst, out); break; default: mtk_vcodec_err(inst, "invalid get parameter type=%d", type); return -EINVAL; } return 0; } const struct vdec_common_if vdec_h264_if = { .init = vdec_h264_init, .decode = vdec_h264_decode, .get_param = vdec_h264_get_param, .deinit = vdec_h264_deinit, };