2 * Copyright (c) 2016 MediaTek Inc.
3 * Author: Jungchang Tsao <jungchang.tsao@mediatek.com>
4 * Daniel Hsiao <daniel.hsiao@mediatek.com>
5 * PoChun Lin <pochun.lin@mediatek.com>
7 * This program is free software; you can redistribute it and/or
9 * it under the terms of the GNU General Public License version 2 as
10 * published by the Free Software Foundation.
12 * This program is distributed in the hope that it will be useful,
13 * but WITHOUT ANY WARRANTY; without even the implied warranty of
14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
15 * GNU General Public License for more details.
18 #include <linux/interrupt.h>
19 #include <linux/kernel.h>
20 #include <linux/slab.h>
22 #include "../mtk_vcodec_drv.h"
23 #include "../mtk_vcodec_util.h"
24 #include "../mtk_vcodec_intr.h"
25 #include "../mtk_vcodec_enc.h"
26 #include "../mtk_vcodec_enc_pm.h"
27 #include "../venc_drv_base.h"
28 #include "../venc_ipi_msg.h"
29 #include "../venc_vpu_if.h"
32 static const char h264_filler_marker
[] = {0x0, 0x0, 0x0, 0x1, 0xc};
34 #define H264_FILLER_MARKER_SIZE ARRAY_SIZE(h264_filler_marker)
35 #define VENC_PIC_BITSTREAM_BYTE_CNT 0x0098
38 * enum venc_h264_vpu_work_buf - h264 encoder buffer index
40 enum venc_h264_vpu_work_buf
{
41 VENC_H264_VPU_WORK_BUF_RC_INFO
,
42 VENC_H264_VPU_WORK_BUF_RC_CODE
,
43 VENC_H264_VPU_WORK_BUF_REC_LUMA
,
44 VENC_H264_VPU_WORK_BUF_REC_CHROMA
,
45 VENC_H264_VPU_WORK_BUF_REF_LUMA
,
46 VENC_H264_VPU_WORK_BUF_REF_CHROMA
,
47 VENC_H264_VPU_WORK_BUF_MV_INFO_1
,
48 VENC_H264_VPU_WORK_BUF_MV_INFO_2
,
49 VENC_H264_VPU_WORK_BUF_SKIP_FRAME
,
50 VENC_H264_VPU_WORK_BUF_MAX
,
54 * enum venc_h264_bs_mode - for bs_mode argument in h264_enc_vpu_encode
56 enum venc_h264_bs_mode
{
63 * struct venc_h264_vpu_config - Structure for h264 encoder configuration
64 * AP-W/R : AP is writer/reader on this item
65 * VPU-W/R: VPU is write/reader on this item
66 * @input_fourcc: input fourcc
67 * @bitrate: target bitrate (in bps)
68 * @pic_w: picture width. Picture size is visible stream resolution, in pixels,
69 * to be used for display purposes; must be smaller or equal to buffer
71 * @pic_h: picture height
72 * @buf_w: buffer width. Buffer size is stream resolution in pixels aligned to
73 * hardware requirements.
74 * @buf_h: buffer height
75 * @gop_size: group of picture size (idr frame)
76 * @intra_period: intra frame period
77 * @framerate: frame rate in fps
78 * @profile: as specified in standard
79 * @level: as specified in standard
80 * @wfd: WFD mode 1:on, 0:off
82 struct venc_h264_vpu_config
{
98 * struct venc_h264_vpu_buf - Structure for buffer information
99 * AP-W/R : AP is writer/reader on this item
100 * VPU-W/R: VPU is write/reader on this item
101 * @iova: IO virtual address
102 * @vpua: VPU side memory addr which is used by RC_CODE
103 * @size: buffer size (in bytes)
105 struct venc_h264_vpu_buf
{
112 * struct venc_h264_vsi - Structure for VPU driver control and info share
113 * AP-W/R : AP is writer/reader on this item
114 * VPU-W/R: VPU is write/reader on this item
115 * This structure is allocated in VPU side and shared to AP side.
116 * @config: h264 encoder configuration
117 * @work_bufs: working buffer information in VPU side
118 * The work_bufs here is for storing the 'size' info shared to AP side.
119 * The similar item in struct venc_h264_inst is for memory allocation
120 * in AP side. The AP driver will copy the 'size' from here to the one in
121 * struct mtk_vcodec_mem, then invoke mtk_vcodec_mem_alloc to allocate
122 * the buffer. After that, bypass the 'dma_addr' to the 'iova' field here for
123 * register setting in VPU side.
125 struct venc_h264_vsi
{
126 struct venc_h264_vpu_config config
;
127 struct venc_h264_vpu_buf work_bufs
[VENC_H264_VPU_WORK_BUF_MAX
];
131 * struct venc_h264_inst - h264 encoder AP driver instance
132 * @hw_base: h264 encoder hardware register base
133 * @work_bufs: working buffer
134 * @pps_buf: buffer to store the pps bitstream
135 * @work_buf_allocated: working buffer allocated flag
136 * @frm_cnt: encoded frame count
137 * @prepend_hdr: when the v4l2 layer send VENC_SET_PARAM_PREPEND_HEADER cmd
138 * through h264_enc_set_param interface, it will set this flag and prepend the
139 * sps/pps in h264_enc_encode function.
140 * @vpu_inst: VPU instance to exchange information between AP and VPU
141 * @vsi: driver structure allocated by VPU side and shared to AP side for
142 * control and info share
143 * @ctx: context for v4l2 layer integration
145 struct venc_h264_inst
{
146 void __iomem
*hw_base
;
147 struct mtk_vcodec_mem work_bufs
[VENC_H264_VPU_WORK_BUF_MAX
];
148 struct mtk_vcodec_mem pps_buf
;
149 bool work_buf_allocated
;
150 unsigned int frm_cnt
;
151 unsigned int prepend_hdr
;
152 struct venc_vpu_inst vpu_inst
;
153 struct venc_h264_vsi
*vsi
;
154 struct mtk_vcodec_ctx
*ctx
;
157 static inline u32
h264_read_reg(struct venc_h264_inst
*inst
, u32 addr
)
159 return readl(inst
->hw_base
+ addr
);
162 static unsigned int h264_get_profile(struct venc_h264_inst
*inst
,
163 unsigned int profile
)
166 case V4L2_MPEG_VIDEO_H264_PROFILE_BASELINE
:
168 case V4L2_MPEG_VIDEO_H264_PROFILE_MAIN
:
170 case V4L2_MPEG_VIDEO_H264_PROFILE_HIGH
:
172 case V4L2_MPEG_VIDEO_H264_PROFILE_CONSTRAINED_BASELINE
:
173 mtk_vcodec_err(inst
, "unsupported CONSTRAINED_BASELINE");
175 case V4L2_MPEG_VIDEO_H264_PROFILE_EXTENDED
:
176 mtk_vcodec_err(inst
, "unsupported EXTENDED");
179 mtk_vcodec_debug(inst
, "unsupported profile %d", profile
);
184 static unsigned int h264_get_level(struct venc_h264_inst
*inst
,
188 case V4L2_MPEG_VIDEO_H264_LEVEL_1B
:
189 mtk_vcodec_err(inst
, "unsupported 1B");
191 case V4L2_MPEG_VIDEO_H264_LEVEL_1_0
:
193 case V4L2_MPEG_VIDEO_H264_LEVEL_1_1
:
195 case V4L2_MPEG_VIDEO_H264_LEVEL_1_2
:
197 case V4L2_MPEG_VIDEO_H264_LEVEL_1_3
:
199 case V4L2_MPEG_VIDEO_H264_LEVEL_2_0
:
201 case V4L2_MPEG_VIDEO_H264_LEVEL_2_1
:
203 case V4L2_MPEG_VIDEO_H264_LEVEL_2_2
:
205 case V4L2_MPEG_VIDEO_H264_LEVEL_3_0
:
207 case V4L2_MPEG_VIDEO_H264_LEVEL_3_1
:
209 case V4L2_MPEG_VIDEO_H264_LEVEL_3_2
:
211 case V4L2_MPEG_VIDEO_H264_LEVEL_4_0
:
213 case V4L2_MPEG_VIDEO_H264_LEVEL_4_1
:
215 case V4L2_MPEG_VIDEO_H264_LEVEL_4_2
:
218 mtk_vcodec_debug(inst
, "unsupported level %d", level
);
223 static void h264_enc_free_work_buf(struct venc_h264_inst
*inst
)
227 mtk_vcodec_debug_enter(inst
);
229 /* Except the SKIP_FRAME buffers,
230 * other buffers need to be freed by AP.
232 for (i
= 0; i
< VENC_H264_VPU_WORK_BUF_MAX
; i
++) {
233 if (i
!= VENC_H264_VPU_WORK_BUF_SKIP_FRAME
)
234 mtk_vcodec_mem_free(inst
->ctx
, &inst
->work_bufs
[i
]);
237 mtk_vcodec_mem_free(inst
->ctx
, &inst
->pps_buf
);
239 mtk_vcodec_debug_leave(inst
);
242 static int h264_enc_alloc_work_buf(struct venc_h264_inst
*inst
)
246 struct venc_h264_vpu_buf
*wb
= inst
->vsi
->work_bufs
;
248 mtk_vcodec_debug_enter(inst
);
250 for (i
= 0; i
< VENC_H264_VPU_WORK_BUF_MAX
; i
++) {
252 * This 'wb' structure is set by VPU side and shared to AP for
253 * buffer allocation and IO virtual addr mapping. For most of
254 * the buffers, AP will allocate the buffer according to 'size'
255 * field and store the IO virtual addr in 'iova' field. There
256 * are two exceptions:
257 * (1) RC_CODE buffer, it's pre-allocated in the VPU side, and
258 * save the VPU addr in the 'vpua' field. The AP will translate
259 * the VPU addr to the corresponding IO virtual addr and store
260 * in 'iova' field for reg setting in VPU side.
261 * (2) SKIP_FRAME buffer, it's pre-allocated in the VPU side,
262 * and save the VPU addr in the 'vpua' field. The AP will
263 * translate the VPU addr to the corresponding AP side virtual
264 * address and do some memcpy access to move to bitstream buffer
265 * assigned by v4l2 layer.
267 inst
->work_bufs
[i
].size
= wb
[i
].size
;
268 if (i
== VENC_H264_VPU_WORK_BUF_SKIP_FRAME
) {
269 inst
->work_bufs
[i
].va
= vpu_mapping_dm_addr(
270 inst
->vpu_inst
.dev
, wb
[i
].vpua
);
271 inst
->work_bufs
[i
].dma_addr
= 0;
273 ret
= mtk_vcodec_mem_alloc(inst
->ctx
,
274 &inst
->work_bufs
[i
]);
277 "cannot allocate buf %d", i
);
281 * This RC_CODE is pre-allocated by VPU and saved in VPU
282 * addr. So we need use memcpy to copy RC_CODE from VPU
283 * addr into IO virtual addr in 'iova' field for reg
284 * setting in VPU side.
286 if (i
== VENC_H264_VPU_WORK_BUF_RC_CODE
) {
289 tmp_va
= vpu_mapping_dm_addr(inst
->vpu_inst
.dev
,
291 memcpy(inst
->work_bufs
[i
].va
, tmp_va
,
295 wb
[i
].iova
= inst
->work_bufs
[i
].dma_addr
;
297 mtk_vcodec_debug(inst
,
298 "work_buf[%d] va=0x%p iova=%pad size=%zu",
299 i
, inst
->work_bufs
[i
].va
,
300 &inst
->work_bufs
[i
].dma_addr
,
301 inst
->work_bufs
[i
].size
);
304 /* the pps_buf is used by AP side only */
305 inst
->pps_buf
.size
= 128;
306 ret
= mtk_vcodec_mem_alloc(inst
->ctx
, &inst
->pps_buf
);
308 mtk_vcodec_err(inst
, "cannot allocate pps_buf");
312 mtk_vcodec_debug_leave(inst
);
317 h264_enc_free_work_buf(inst
);
322 static unsigned int h264_enc_wait_venc_done(struct venc_h264_inst
*inst
)
324 unsigned int irq_status
= 0;
325 struct mtk_vcodec_ctx
*ctx
= (struct mtk_vcodec_ctx
*)inst
->ctx
;
327 if (!mtk_vcodec_wait_for_done_ctx(ctx
, MTK_INST_IRQ_RECEIVED
,
328 WAIT_INTR_TIMEOUT_MS
)) {
329 irq_status
= ctx
->irq_status
;
330 mtk_vcodec_debug(inst
, "irq_status %x <-", irq_status
);
335 static int h264_encode_sps(struct venc_h264_inst
*inst
,
336 struct mtk_vcodec_mem
*bs_buf
,
337 unsigned int *bs_size
)
340 unsigned int irq_status
;
342 mtk_vcodec_debug_enter(inst
);
344 ret
= vpu_enc_encode(&inst
->vpu_inst
, H264_BS_MODE_SPS
, NULL
,
349 irq_status
= h264_enc_wait_venc_done(inst
);
350 if (irq_status
!= MTK_VENC_IRQ_STATUS_SPS
) {
351 mtk_vcodec_err(inst
, "expect irq status %d",
352 MTK_VENC_IRQ_STATUS_SPS
);
356 *bs_size
= h264_read_reg(inst
, VENC_PIC_BITSTREAM_BYTE_CNT
);
357 mtk_vcodec_debug(inst
, "bs size %d <-", *bs_size
);
362 static int h264_encode_pps(struct venc_h264_inst
*inst
,
363 struct mtk_vcodec_mem
*bs_buf
,
364 unsigned int *bs_size
)
367 unsigned int irq_status
;
369 mtk_vcodec_debug_enter(inst
);
371 ret
= vpu_enc_encode(&inst
->vpu_inst
, H264_BS_MODE_PPS
, NULL
,
376 irq_status
= h264_enc_wait_venc_done(inst
);
377 if (irq_status
!= MTK_VENC_IRQ_STATUS_PPS
) {
378 mtk_vcodec_err(inst
, "expect irq status %d",
379 MTK_VENC_IRQ_STATUS_PPS
);
383 *bs_size
= h264_read_reg(inst
, VENC_PIC_BITSTREAM_BYTE_CNT
);
384 mtk_vcodec_debug(inst
, "bs size %d <-", *bs_size
);
389 static int h264_encode_header(struct venc_h264_inst
*inst
,
390 struct mtk_vcodec_mem
*bs_buf
,
391 unsigned int *bs_size
)
394 unsigned int bs_size_sps
;
395 unsigned int bs_size_pps
;
397 ret
= h264_encode_sps(inst
, bs_buf
, &bs_size_sps
);
401 ret
= h264_encode_pps(inst
, &inst
->pps_buf
, &bs_size_pps
);
405 memcpy(bs_buf
->va
+ bs_size_sps
, inst
->pps_buf
.va
, bs_size_pps
);
406 *bs_size
= bs_size_sps
+ bs_size_pps
;
411 static int h264_encode_frame(struct venc_h264_inst
*inst
,
412 struct venc_frm_buf
*frm_buf
,
413 struct mtk_vcodec_mem
*bs_buf
,
414 unsigned int *bs_size
)
417 unsigned int irq_status
;
419 mtk_vcodec_debug_enter(inst
);
421 ret
= vpu_enc_encode(&inst
->vpu_inst
, H264_BS_MODE_FRAME
, frm_buf
,
427 * skip frame case: The skip frame buffer is composed by vpu side only,
428 * it does not trigger the hw, so skip the wait interrupt operation.
430 if (inst
->vpu_inst
.state
== VEN_IPI_MSG_ENC_STATE_SKIP
) {
431 *bs_size
= inst
->vpu_inst
.bs_size
;
433 inst
->work_bufs
[VENC_H264_VPU_WORK_BUF_SKIP_FRAME
].va
,
439 irq_status
= h264_enc_wait_venc_done(inst
);
440 if (irq_status
!= MTK_VENC_IRQ_STATUS_FRM
) {
441 mtk_vcodec_err(inst
, "irq_status=%d failed", irq_status
);
445 *bs_size
= h264_read_reg(inst
, VENC_PIC_BITSTREAM_BYTE_CNT
);
448 mtk_vcodec_debug(inst
, "frm %d bs_size %d key_frm %d <-",
449 inst
->frm_cnt
, *bs_size
, inst
->vpu_inst
.is_key_frm
);
454 static void h264_encode_filler(struct venc_h264_inst
*inst
, void *buf
,
457 unsigned char *p
= buf
;
459 if (size
< H264_FILLER_MARKER_SIZE
) {
460 mtk_vcodec_err(inst
, "filler size too small %d", size
);
464 memcpy(p
, h264_filler_marker
, ARRAY_SIZE(h264_filler_marker
));
465 size
-= H264_FILLER_MARKER_SIZE
;
466 p
+= H264_FILLER_MARKER_SIZE
;
467 memset(p
, 0xff, size
);
470 static int h264_enc_init(struct mtk_vcodec_ctx
*ctx
, unsigned long *handle
)
473 struct venc_h264_inst
*inst
;
475 inst
= kzalloc(sizeof(*inst
), GFP_KERNEL
);
480 inst
->vpu_inst
.ctx
= ctx
;
481 inst
->vpu_inst
.dev
= ctx
->dev
->vpu_plat_dev
;
482 inst
->vpu_inst
.id
= IPI_VENC_H264
;
483 inst
->hw_base
= mtk_vcodec_get_reg_addr(inst
->ctx
, VENC_SYS
);
485 mtk_vcodec_debug_enter(inst
);
487 ret
= vpu_enc_init(&inst
->vpu_inst
);
489 inst
->vsi
= (struct venc_h264_vsi
*)inst
->vpu_inst
.vsi
;
491 mtk_vcodec_debug_leave(inst
);
496 (*handle
) = (unsigned long)inst
;
501 static int h264_enc_encode(unsigned long handle
,
502 enum venc_start_opt opt
,
503 struct venc_frm_buf
*frm_buf
,
504 struct mtk_vcodec_mem
*bs_buf
,
505 struct venc_done_result
*result
)
508 struct venc_h264_inst
*inst
= (struct venc_h264_inst
*)handle
;
509 struct mtk_vcodec_ctx
*ctx
= inst
->ctx
;
511 mtk_vcodec_debug(inst
, "opt %d ->", opt
);
513 enable_irq(ctx
->dev
->enc_irq
);
516 case VENC_START_OPT_ENCODE_SEQUENCE_HEADER
: {
517 unsigned int bs_size_hdr
;
519 ret
= h264_encode_header(inst
, bs_buf
, &bs_size_hdr
);
523 result
->bs_size
= bs_size_hdr
;
524 result
->is_key_frm
= false;
528 case VENC_START_OPT_ENCODE_FRAME
: {
532 const int bs_alignment
= 128;
533 struct mtk_vcodec_mem tmp_bs_buf
;
534 unsigned int bs_size_hdr
;
535 unsigned int bs_size_frm
;
537 if (!inst
->prepend_hdr
) {
538 ret
= h264_encode_frame(inst
, frm_buf
, bs_buf
,
542 result
->is_key_frm
= inst
->vpu_inst
.is_key_frm
;
546 mtk_vcodec_debug(inst
, "h264_encode_frame prepend SPS/PPS");
548 ret
= h264_encode_header(inst
, bs_buf
, &bs_size_hdr
);
552 hdr_sz
= bs_size_hdr
;
553 hdr_sz_ext
= (hdr_sz
& (bs_alignment
- 1));
555 filler_sz
= bs_alignment
- hdr_sz_ext
;
556 if (hdr_sz_ext
+ H264_FILLER_MARKER_SIZE
> bs_alignment
)
557 filler_sz
+= bs_alignment
;
558 h264_encode_filler(inst
, bs_buf
->va
+ hdr_sz
,
562 tmp_bs_buf
.va
= bs_buf
->va
+ hdr_sz
+ filler_sz
;
563 tmp_bs_buf
.dma_addr
= bs_buf
->dma_addr
+ hdr_sz
+ filler_sz
;
564 tmp_bs_buf
.size
= bs_buf
->size
- (hdr_sz
+ filler_sz
);
566 ret
= h264_encode_frame(inst
, frm_buf
, &tmp_bs_buf
,
571 result
->bs_size
= hdr_sz
+ filler_sz
+ bs_size_frm
;
573 mtk_vcodec_debug(inst
, "hdr %d filler %d frame %d bs %d",
574 hdr_sz
, filler_sz
, bs_size_frm
,
577 inst
->prepend_hdr
= 0;
578 result
->is_key_frm
= inst
->vpu_inst
.is_key_frm
;
583 mtk_vcodec_err(inst
, "venc_start_opt %d not supported", opt
);
590 disable_irq(ctx
->dev
->enc_irq
);
591 mtk_vcodec_debug(inst
, "opt %d <-", opt
);
596 static int h264_enc_set_param(unsigned long handle
,
597 enum venc_set_param_type type
,
598 struct venc_enc_param
*enc_prm
)
601 struct venc_h264_inst
*inst
= (struct venc_h264_inst
*)handle
;
603 mtk_vcodec_debug(inst
, "->type=%d", type
);
606 case VENC_SET_PARAM_ENC
:
607 inst
->vsi
->config
.input_fourcc
= enc_prm
->input_yuv_fmt
;
608 inst
->vsi
->config
.bitrate
= enc_prm
->bitrate
;
609 inst
->vsi
->config
.pic_w
= enc_prm
->width
;
610 inst
->vsi
->config
.pic_h
= enc_prm
->height
;
611 inst
->vsi
->config
.buf_w
= enc_prm
->buf_width
;
612 inst
->vsi
->config
.buf_h
= enc_prm
->buf_height
;
613 inst
->vsi
->config
.gop_size
= enc_prm
->gop_size
;
614 inst
->vsi
->config
.framerate
= enc_prm
->frm_rate
;
615 inst
->vsi
->config
.intra_period
= enc_prm
->intra_period
;
616 inst
->vsi
->config
.profile
=
617 h264_get_profile(inst
, enc_prm
->h264_profile
);
618 inst
->vsi
->config
.level
=
619 h264_get_level(inst
, enc_prm
->h264_level
);
620 inst
->vsi
->config
.wfd
= 0;
621 ret
= vpu_enc_set_param(&inst
->vpu_inst
, type
, enc_prm
);
624 if (inst
->work_buf_allocated
) {
625 h264_enc_free_work_buf(inst
);
626 inst
->work_buf_allocated
= false;
628 ret
= h264_enc_alloc_work_buf(inst
);
631 inst
->work_buf_allocated
= true;
634 case VENC_SET_PARAM_PREPEND_HEADER
:
635 inst
->prepend_hdr
= 1;
636 mtk_vcodec_debug(inst
, "set prepend header mode");
640 ret
= vpu_enc_set_param(&inst
->vpu_inst
, type
, enc_prm
);
644 mtk_vcodec_debug_leave(inst
);
649 static int h264_enc_deinit(unsigned long handle
)
652 struct venc_h264_inst
*inst
= (struct venc_h264_inst
*)handle
;
654 mtk_vcodec_debug_enter(inst
);
656 ret
= vpu_enc_deinit(&inst
->vpu_inst
);
658 if (inst
->work_buf_allocated
)
659 h264_enc_free_work_buf(inst
);
661 mtk_vcodec_debug_leave(inst
);
667 static const struct venc_common_if venc_h264_if
= {
668 .init
= h264_enc_init
,
669 .encode
= h264_enc_encode
,
670 .set_param
= h264_enc_set_param
,
671 .deinit
= h264_enc_deinit
,
674 const struct venc_common_if
*get_h264_enc_comm_if(void);
676 const struct venc_common_if
*get_h264_enc_comm_if(void)
678 return &venc_h264_if
;