2 * Copyright (c) 2016 MediaTek Inc.
3 * Author: Jungchang Tsao <jungchang.tsao@mediatek.com>
4 * Daniel Hsiao <daniel.hsiao@mediatek.com>
5 * PoChun Lin <pochun.lin@mediatek.com>
7 * This program is free software; you can redistribute it and/or
9 * it under the terms of the GNU General Public License version 2 as
10 * published by the Free Software Foundation.
12 * This program is distributed in the hope that it will be useful,
13 * but WITHOUT ANY WARRANTY; without even the implied warranty of
14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
15 * GNU General Public License for more details.
18 #include <linux/interrupt.h>
19 #include <linux/kernel.h>
20 #include <linux/slab.h>
22 #include "../mtk_vcodec_drv.h"
23 #include "../mtk_vcodec_util.h"
24 #include "../mtk_vcodec_intr.h"
25 #include "../mtk_vcodec_enc.h"
26 #include "../mtk_vcodec_enc_pm.h"
27 #include "../venc_drv_base.h"
28 #include "../venc_ipi_msg.h"
29 #include "../venc_vpu_if.h"
32 static const char h264_filler_marker[] = {0x0, 0x0, 0x0, 0x1, 0xc};
34 #define H264_FILLER_MARKER_SIZE ARRAY_SIZE(h264_filler_marker)
35 #define VENC_PIC_BITSTREAM_BYTE_CNT 0x0098
38 * enum venc_h264_vpu_work_buf - h264 encoder buffer index
40 enum venc_h264_vpu_work_buf {
41 VENC_H264_VPU_WORK_BUF_RC_INFO,
42 VENC_H264_VPU_WORK_BUF_RC_CODE,
43 VENC_H264_VPU_WORK_BUF_REC_LUMA,
44 VENC_H264_VPU_WORK_BUF_REC_CHROMA,
45 VENC_H264_VPU_WORK_BUF_REF_LUMA,
46 VENC_H264_VPU_WORK_BUF_REF_CHROMA,
47 VENC_H264_VPU_WORK_BUF_MV_INFO_1,
48 VENC_H264_VPU_WORK_BUF_MV_INFO_2,
49 VENC_H264_VPU_WORK_BUF_SKIP_FRAME,
50 VENC_H264_VPU_WORK_BUF_MAX,
54 * enum venc_h264_bs_mode - for bs_mode argument in h264_enc_vpu_encode
56 enum venc_h264_bs_mode {
63 * struct venc_h264_vpu_config - Structure for h264 encoder configuration
64 * AP-W/R : AP is writer/reader on this item
65 * VPU-W/R: VPU is write/reader on this item
66 * @input_fourcc: input fourcc
67 * @bitrate: target bitrate (in bps)
68 * @pic_w: picture width. Picture size is visible stream resolution, in pixels,
69 * to be used for display purposes; must be smaller or equal to buffer
71 * @pic_h: picture height
72 * @buf_w: buffer width. Buffer size is stream resolution in pixels aligned to
73 * hardware requirements.
74 * @buf_h: buffer height
75 * @gop_size: group of picture size (idr frame)
76 * @intra_period: intra frame period
77 * @framerate: frame rate in fps
78 * @profile: as specified in standard
79 * @level: as specified in standard
80 * @wfd: WFD mode 1:on, 0:off
82 struct venc_h264_vpu_config {
98 * struct venc_h264_vpu_buf - Structure for buffer information
99 * AP-W/R : AP is writer/reader on this item
100 * VPU-W/R: VPU is write/reader on this item
101 * @iova: IO virtual address
102 * @vpua: VPU side memory addr which is used by RC_CODE
103 * @size: buffer size (in bytes)
105 struct venc_h264_vpu_buf {
112 * struct venc_h264_vsi - Structure for VPU driver control and info share
113 * AP-W/R : AP is writer/reader on this item
114 * VPU-W/R: VPU is write/reader on this item
115 * This structure is allocated in VPU side and shared to AP side.
116 * @config: h264 encoder configuration
117 * @work_bufs: working buffer information in VPU side
118 * The work_bufs here is for storing the 'size' info shared to AP side.
119 * The similar item in struct venc_h264_inst is for memory allocation
120 * in AP side. The AP driver will copy the 'size' from here to the one in
121 * struct mtk_vcodec_mem, then invoke mtk_vcodec_mem_alloc to allocate
122 * the buffer. After that, bypass the 'dma_addr' to the 'iova' field here for
123 * register setting in VPU side.
125 struct venc_h264_vsi {
126 struct venc_h264_vpu_config config;
127 struct venc_h264_vpu_buf work_bufs[VENC_H264_VPU_WORK_BUF_MAX];
131 * struct venc_h264_inst - h264 encoder AP driver instance
132 * @hw_base: h264 encoder hardware register base
133 * @work_bufs: working buffer
134 * @pps_buf: buffer to store the pps bitstream
135 * @work_buf_allocated: working buffer allocated flag
136 * @frm_cnt: encoded frame count
137 * @prepend_hdr: when the v4l2 layer send VENC_SET_PARAM_PREPEND_HEADER cmd
138 * through h264_enc_set_param interface, it will set this flag and prepend the
139 * sps/pps in h264_enc_encode function.
140 * @vpu_inst: VPU instance to exchange information between AP and VPU
141 * @vsi: driver structure allocated by VPU side and shared to AP side for
142 * control and info share
143 * @ctx: context for v4l2 layer integration
145 struct venc_h264_inst {
146 void __iomem *hw_base;
147 struct mtk_vcodec_mem work_bufs[VENC_H264_VPU_WORK_BUF_MAX];
148 struct mtk_vcodec_mem pps_buf;
149 bool work_buf_allocated;
150 unsigned int frm_cnt;
151 unsigned int prepend_hdr;
152 struct venc_vpu_inst vpu_inst;
153 struct venc_h264_vsi *vsi;
154 struct mtk_vcodec_ctx *ctx;
157 static inline u32 h264_read_reg(struct venc_h264_inst *inst, u32 addr)
159 return readl(inst->hw_base + addr);
162 static unsigned int h264_get_profile(struct venc_h264_inst *inst,
163 unsigned int profile)
166 case V4L2_MPEG_VIDEO_H264_PROFILE_BASELINE:
168 case V4L2_MPEG_VIDEO_H264_PROFILE_MAIN:
170 case V4L2_MPEG_VIDEO_H264_PROFILE_HIGH:
172 case V4L2_MPEG_VIDEO_H264_PROFILE_CONSTRAINED_BASELINE:
173 mtk_vcodec_err(inst, "unsupported CONSTRAINED_BASELINE");
175 case V4L2_MPEG_VIDEO_H264_PROFILE_EXTENDED:
176 mtk_vcodec_err(inst, "unsupported EXTENDED");
179 mtk_vcodec_debug(inst, "unsupported profile %d", profile);
184 static unsigned int h264_get_level(struct venc_h264_inst *inst,
188 case V4L2_MPEG_VIDEO_H264_LEVEL_1B:
189 mtk_vcodec_err(inst, "unsupported 1B");
191 case V4L2_MPEG_VIDEO_H264_LEVEL_1_0:
193 case V4L2_MPEG_VIDEO_H264_LEVEL_1_1:
195 case V4L2_MPEG_VIDEO_H264_LEVEL_1_2:
197 case V4L2_MPEG_VIDEO_H264_LEVEL_1_3:
199 case V4L2_MPEG_VIDEO_H264_LEVEL_2_0:
201 case V4L2_MPEG_VIDEO_H264_LEVEL_2_1:
203 case V4L2_MPEG_VIDEO_H264_LEVEL_2_2:
205 case V4L2_MPEG_VIDEO_H264_LEVEL_3_0:
207 case V4L2_MPEG_VIDEO_H264_LEVEL_3_1:
209 case V4L2_MPEG_VIDEO_H264_LEVEL_3_2:
211 case V4L2_MPEG_VIDEO_H264_LEVEL_4_0:
213 case V4L2_MPEG_VIDEO_H264_LEVEL_4_1:
215 case V4L2_MPEG_VIDEO_H264_LEVEL_4_2:
218 mtk_vcodec_debug(inst, "unsupported level %d", level);
223 static void h264_enc_free_work_buf(struct venc_h264_inst *inst)
227 mtk_vcodec_debug_enter(inst);
229 /* Except the SKIP_FRAME buffers,
230 * other buffers need to be freed by AP.
232 for (i = 0; i < VENC_H264_VPU_WORK_BUF_MAX; i++) {
233 if (i != VENC_H264_VPU_WORK_BUF_SKIP_FRAME)
234 mtk_vcodec_mem_free(inst->ctx, &inst->work_bufs[i]);
237 mtk_vcodec_mem_free(inst->ctx, &inst->pps_buf);
239 mtk_vcodec_debug_leave(inst);
242 static int h264_enc_alloc_work_buf(struct venc_h264_inst *inst)
246 struct venc_h264_vpu_buf *wb = inst->vsi->work_bufs;
248 mtk_vcodec_debug_enter(inst);
250 for (i = 0; i < VENC_H264_VPU_WORK_BUF_MAX; i++) {
252 * This 'wb' structure is set by VPU side and shared to AP for
253 * buffer allocation and IO virtual addr mapping. For most of
254 * the buffers, AP will allocate the buffer according to 'size'
255 * field and store the IO virtual addr in 'iova' field. There
256 * are two exceptions:
257 * (1) RC_CODE buffer, it's pre-allocated in the VPU side, and
258 * save the VPU addr in the 'vpua' field. The AP will translate
259 * the VPU addr to the corresponding IO virtual addr and store
260 * in 'iova' field for reg setting in VPU side.
261 * (2) SKIP_FRAME buffer, it's pre-allocated in the VPU side,
262 * and save the VPU addr in the 'vpua' field. The AP will
263 * translate the VPU addr to the corresponding AP side virtual
264 * address and do some memcpy access to move to bitstream buffer
265 * assigned by v4l2 layer.
267 inst->work_bufs[i].size = wb[i].size;
268 if (i == VENC_H264_VPU_WORK_BUF_SKIP_FRAME) {
269 inst->work_bufs[i].va = vpu_mapping_dm_addr(
270 inst->vpu_inst.dev, wb[i].vpua);
271 inst->work_bufs[i].dma_addr = 0;
273 ret = mtk_vcodec_mem_alloc(inst->ctx,
274 &inst->work_bufs[i]);
277 "cannot allocate buf %d", i);
281 * This RC_CODE is pre-allocated by VPU and saved in VPU
282 * addr. So we need use memcpy to copy RC_CODE from VPU
283 * addr into IO virtual addr in 'iova' field for reg
284 * setting in VPU side.
286 if (i == VENC_H264_VPU_WORK_BUF_RC_CODE) {
289 tmp_va = vpu_mapping_dm_addr(inst->vpu_inst.dev,
291 memcpy(inst->work_bufs[i].va, tmp_va,
295 wb[i].iova = inst->work_bufs[i].dma_addr;
297 mtk_vcodec_debug(inst,
298 "work_buf[%d] va=0x%p iova=%pad size=%zu",
299 i, inst->work_bufs[i].va,
300 &inst->work_bufs[i].dma_addr,
301 inst->work_bufs[i].size);
304 /* the pps_buf is used by AP side only */
305 inst->pps_buf.size = 128;
306 ret = mtk_vcodec_mem_alloc(inst->ctx, &inst->pps_buf);
308 mtk_vcodec_err(inst, "cannot allocate pps_buf");
312 mtk_vcodec_debug_leave(inst);
317 h264_enc_free_work_buf(inst);
322 static unsigned int h264_enc_wait_venc_done(struct venc_h264_inst *inst)
324 unsigned int irq_status = 0;
325 struct mtk_vcodec_ctx *ctx = (struct mtk_vcodec_ctx *)inst->ctx;
327 if (!mtk_vcodec_wait_for_done_ctx(ctx, MTK_INST_IRQ_RECEIVED,
328 WAIT_INTR_TIMEOUT_MS)) {
329 irq_status = ctx->irq_status;
330 mtk_vcodec_debug(inst, "irq_status %x <-", irq_status);
335 static int h264_encode_sps(struct venc_h264_inst *inst,
336 struct mtk_vcodec_mem *bs_buf,
337 unsigned int *bs_size)
340 unsigned int irq_status;
342 mtk_vcodec_debug_enter(inst);
344 ret = vpu_enc_encode(&inst->vpu_inst, H264_BS_MODE_SPS, NULL,
349 irq_status = h264_enc_wait_venc_done(inst);
350 if (irq_status != MTK_VENC_IRQ_STATUS_SPS) {
351 mtk_vcodec_err(inst, "expect irq status %d",
352 MTK_VENC_IRQ_STATUS_SPS);
356 *bs_size = h264_read_reg(inst, VENC_PIC_BITSTREAM_BYTE_CNT);
357 mtk_vcodec_debug(inst, "bs size %d <-", *bs_size);
362 static int h264_encode_pps(struct venc_h264_inst *inst,
363 struct mtk_vcodec_mem *bs_buf,
364 unsigned int *bs_size)
367 unsigned int irq_status;
369 mtk_vcodec_debug_enter(inst);
371 ret = vpu_enc_encode(&inst->vpu_inst, H264_BS_MODE_PPS, NULL,
376 irq_status = h264_enc_wait_venc_done(inst);
377 if (irq_status != MTK_VENC_IRQ_STATUS_PPS) {
378 mtk_vcodec_err(inst, "expect irq status %d",
379 MTK_VENC_IRQ_STATUS_PPS);
383 *bs_size = h264_read_reg(inst, VENC_PIC_BITSTREAM_BYTE_CNT);
384 mtk_vcodec_debug(inst, "bs size %d <-", *bs_size);
389 static int h264_encode_header(struct venc_h264_inst *inst,
390 struct mtk_vcodec_mem *bs_buf,
391 unsigned int *bs_size)
394 unsigned int bs_size_sps;
395 unsigned int bs_size_pps;
397 ret = h264_encode_sps(inst, bs_buf, &bs_size_sps);
401 ret = h264_encode_pps(inst, &inst->pps_buf, &bs_size_pps);
405 memcpy(bs_buf->va + bs_size_sps, inst->pps_buf.va, bs_size_pps);
406 *bs_size = bs_size_sps + bs_size_pps;
411 static int h264_encode_frame(struct venc_h264_inst *inst,
412 struct venc_frm_buf *frm_buf,
413 struct mtk_vcodec_mem *bs_buf,
414 unsigned int *bs_size)
417 unsigned int irq_status;
419 mtk_vcodec_debug_enter(inst);
421 ret = vpu_enc_encode(&inst->vpu_inst, H264_BS_MODE_FRAME, frm_buf,
427 * skip frame case: The skip frame buffer is composed by vpu side only,
428 * it does not trigger the hw, so skip the wait interrupt operation.
430 if (inst->vpu_inst.state == VEN_IPI_MSG_ENC_STATE_SKIP) {
431 *bs_size = inst->vpu_inst.bs_size;
433 inst->work_bufs[VENC_H264_VPU_WORK_BUF_SKIP_FRAME].va,
439 irq_status = h264_enc_wait_venc_done(inst);
440 if (irq_status != MTK_VENC_IRQ_STATUS_FRM) {
441 mtk_vcodec_err(inst, "irq_status=%d failed", irq_status);
445 *bs_size = h264_read_reg(inst, VENC_PIC_BITSTREAM_BYTE_CNT);
448 mtk_vcodec_debug(inst, "frm %d bs_size %d key_frm %d <-",
449 inst->frm_cnt, *bs_size, inst->vpu_inst.is_key_frm);
454 static void h264_encode_filler(struct venc_h264_inst *inst, void *buf,
457 unsigned char *p = buf;
459 if (size < H264_FILLER_MARKER_SIZE) {
460 mtk_vcodec_err(inst, "filler size too small %d", size);
464 memcpy(p, h264_filler_marker, ARRAY_SIZE(h264_filler_marker));
465 size -= H264_FILLER_MARKER_SIZE;
466 p += H264_FILLER_MARKER_SIZE;
467 memset(p, 0xff, size);
470 static int h264_enc_init(struct mtk_vcodec_ctx *ctx, unsigned long *handle)
473 struct venc_h264_inst *inst;
475 inst = kzalloc(sizeof(*inst), GFP_KERNEL);
480 inst->vpu_inst.ctx = ctx;
481 inst->vpu_inst.dev = ctx->dev->vpu_plat_dev;
482 inst->vpu_inst.id = IPI_VENC_H264;
483 inst->hw_base = mtk_vcodec_get_reg_addr(inst->ctx, VENC_SYS);
485 mtk_vcodec_debug_enter(inst);
487 ret = vpu_enc_init(&inst->vpu_inst);
489 inst->vsi = (struct venc_h264_vsi *)inst->vpu_inst.vsi;
491 mtk_vcodec_debug_leave(inst);
496 (*handle) = (unsigned long)inst;
501 static int h264_enc_encode(unsigned long handle,
502 enum venc_start_opt opt,
503 struct venc_frm_buf *frm_buf,
504 struct mtk_vcodec_mem *bs_buf,
505 struct venc_done_result *result)
508 struct venc_h264_inst *inst = (struct venc_h264_inst *)handle;
509 struct mtk_vcodec_ctx *ctx = inst->ctx;
511 mtk_vcodec_debug(inst, "opt %d ->", opt);
513 enable_irq(ctx->dev->enc_irq);
516 case VENC_START_OPT_ENCODE_SEQUENCE_HEADER: {
517 unsigned int bs_size_hdr;
519 ret = h264_encode_header(inst, bs_buf, &bs_size_hdr);
523 result->bs_size = bs_size_hdr;
524 result->is_key_frm = false;
528 case VENC_START_OPT_ENCODE_FRAME: {
532 const int bs_alignment = 128;
533 struct mtk_vcodec_mem tmp_bs_buf;
534 unsigned int bs_size_hdr;
535 unsigned int bs_size_frm;
537 if (!inst->prepend_hdr) {
538 ret = h264_encode_frame(inst, frm_buf, bs_buf,
542 result->is_key_frm = inst->vpu_inst.is_key_frm;
546 mtk_vcodec_debug(inst, "h264_encode_frame prepend SPS/PPS");
548 ret = h264_encode_header(inst, bs_buf, &bs_size_hdr);
552 hdr_sz = bs_size_hdr;
553 hdr_sz_ext = (hdr_sz & (bs_alignment - 1));
555 filler_sz = bs_alignment - hdr_sz_ext;
556 if (hdr_sz_ext + H264_FILLER_MARKER_SIZE > bs_alignment)
557 filler_sz += bs_alignment;
558 h264_encode_filler(inst, bs_buf->va + hdr_sz,
562 tmp_bs_buf.va = bs_buf->va + hdr_sz + filler_sz;
563 tmp_bs_buf.dma_addr = bs_buf->dma_addr + hdr_sz + filler_sz;
564 tmp_bs_buf.size = bs_buf->size - (hdr_sz + filler_sz);
566 ret = h264_encode_frame(inst, frm_buf, &tmp_bs_buf,
571 result->bs_size = hdr_sz + filler_sz + bs_size_frm;
573 mtk_vcodec_debug(inst, "hdr %d filler %d frame %d bs %d",
574 hdr_sz, filler_sz, bs_size_frm,
577 inst->prepend_hdr = 0;
578 result->is_key_frm = inst->vpu_inst.is_key_frm;
583 mtk_vcodec_err(inst, "venc_start_opt %d not supported", opt);
590 disable_irq(ctx->dev->enc_irq);
591 mtk_vcodec_debug(inst, "opt %d <-", opt);
596 static int h264_enc_set_param(unsigned long handle,
597 enum venc_set_param_type type,
598 struct venc_enc_param *enc_prm)
601 struct venc_h264_inst *inst = (struct venc_h264_inst *)handle;
603 mtk_vcodec_debug(inst, "->type=%d", type);
606 case VENC_SET_PARAM_ENC:
607 inst->vsi->config.input_fourcc = enc_prm->input_yuv_fmt;
608 inst->vsi->config.bitrate = enc_prm->bitrate;
609 inst->vsi->config.pic_w = enc_prm->width;
610 inst->vsi->config.pic_h = enc_prm->height;
611 inst->vsi->config.buf_w = enc_prm->buf_width;
612 inst->vsi->config.buf_h = enc_prm->buf_height;
613 inst->vsi->config.gop_size = enc_prm->gop_size;
614 inst->vsi->config.framerate = enc_prm->frm_rate;
615 inst->vsi->config.intra_period = enc_prm->intra_period;
616 inst->vsi->config.profile =
617 h264_get_profile(inst, enc_prm->h264_profile);
618 inst->vsi->config.level =
619 h264_get_level(inst, enc_prm->h264_level);
620 inst->vsi->config.wfd = 0;
621 ret = vpu_enc_set_param(&inst->vpu_inst, type, enc_prm);
624 if (inst->work_buf_allocated) {
625 h264_enc_free_work_buf(inst);
626 inst->work_buf_allocated = false;
628 ret = h264_enc_alloc_work_buf(inst);
631 inst->work_buf_allocated = true;
634 case VENC_SET_PARAM_PREPEND_HEADER:
635 inst->prepend_hdr = 1;
636 mtk_vcodec_debug(inst, "set prepend header mode");
640 ret = vpu_enc_set_param(&inst->vpu_inst, type, enc_prm);
644 mtk_vcodec_debug_leave(inst);
649 static int h264_enc_deinit(unsigned long handle)
652 struct venc_h264_inst *inst = (struct venc_h264_inst *)handle;
654 mtk_vcodec_debug_enter(inst);
656 ret = vpu_enc_deinit(&inst->vpu_inst);
658 if (inst->work_buf_allocated)
659 h264_enc_free_work_buf(inst);
661 mtk_vcodec_debug_leave(inst);
667 static const struct venc_common_if venc_h264_if = {
674 const struct venc_common_if *get_h264_enc_comm_if(void);
676 const struct venc_common_if *get_h264_enc_comm_if(void)
678 return &venc_h264_if;