1 // SPDX-License-Identifier: GPL-2.0
3 * Hantro G1 post-processor support
5 * Copyright (C) 2019 Collabora, Ltd.
8 #include <linux/dma-mapping.h>
9 #include <linux/types.h>
12 #include "hantro_hw.h"
13 #include "hantro_g1_regs.h"
14 #include "hantro_g2_regs.h"
15 #include "hantro_v4l2.h"
17 #define HANTRO_PP_REG_WRITE(vpu, reg_name, val) \
19 hantro_reg_write(vpu, \
20 &hantro_g1_postproc_regs.reg_name, \
24 #define HANTRO_PP_REG_WRITE_RELAXED(vpu, reg_name, val) \
26 hantro_reg_write_relaxed(vpu, \
27 &hantro_g1_postproc_regs.reg_name, \
31 #define VPU_PP_IN_YUYV 0x0
32 #define VPU_PP_IN_NV12 0x1
33 #define VPU_PP_IN_YUV420 0x2
34 #define VPU_PP_IN_YUV240_TILED 0x5
35 #define VPU_PP_OUT_RGB 0x0
36 #define VPU_PP_OUT_YUYV 0x3
38 static const struct hantro_postproc_regs hantro_g1_postproc_regs
= {
39 .pipeline_en
= {G1_REG_PP_INTERRUPT
, 1, 0x1},
40 .max_burst
= {G1_REG_PP_DEV_CONFIG
, 0, 0x1f},
41 .clk_gate
= {G1_REG_PP_DEV_CONFIG
, 1, 0x1},
42 .out_swap32
= {G1_REG_PP_DEV_CONFIG
, 5, 0x1},
43 .out_endian
= {G1_REG_PP_DEV_CONFIG
, 6, 0x1},
44 .out_luma_base
= {G1_REG_PP_OUT_LUMA_BASE
, 0, 0xffffffff},
45 .input_width
= {G1_REG_PP_INPUT_SIZE
, 0, 0x1ff},
46 .input_height
= {G1_REG_PP_INPUT_SIZE
, 9, 0x1ff},
47 .output_width
= {G1_REG_PP_CONTROL
, 4, 0x7ff},
48 .output_height
= {G1_REG_PP_CONTROL
, 15, 0x7ff},
49 .input_fmt
= {G1_REG_PP_CONTROL
, 29, 0x7},
50 .output_fmt
= {G1_REG_PP_CONTROL
, 26, 0x7},
51 .orig_width
= {G1_REG_PP_MASK1_ORIG_WIDTH
, 23, 0x1ff},
52 .display_width
= {G1_REG_PP_DISPLAY_WIDTH
, 0, 0xfff},
55 bool hantro_needs_postproc(const struct hantro_ctx
*ctx
,
56 const struct hantro_fmt
*fmt
)
61 if (ctx
->need_postproc
)
64 return fmt
->postprocessed
;
67 static void hantro_postproc_g1_enable(struct hantro_ctx
*ctx
)
69 struct hantro_dev
*vpu
= ctx
->dev
;
70 struct vb2_v4l2_buffer
*dst_buf
;
71 u32 src_pp_fmt
, dst_pp_fmt
;
74 /* Turn on pipeline mode. Must be done first. */
75 HANTRO_PP_REG_WRITE(vpu
, pipeline_en
, 0x1);
77 src_pp_fmt
= VPU_PP_IN_NV12
;
79 switch (ctx
->vpu_dst_fmt
->fourcc
) {
80 case V4L2_PIX_FMT_YUYV
:
81 dst_pp_fmt
= VPU_PP_OUT_YUYV
;
84 WARN(1, "output format %d not supported by the post-processor, this wasn't expected.",
85 ctx
->vpu_dst_fmt
->fourcc
);
90 dst_buf
= v4l2_m2m_next_dst_buf(ctx
->fh
.m2m_ctx
);
91 dst_dma
= vb2_dma_contig_plane_dma_addr(&dst_buf
->vb2_buf
, 0);
93 HANTRO_PP_REG_WRITE(vpu
, clk_gate
, 0x1);
94 HANTRO_PP_REG_WRITE(vpu
, out_endian
, 0x1);
95 HANTRO_PP_REG_WRITE(vpu
, out_swap32
, 0x1);
96 HANTRO_PP_REG_WRITE(vpu
, max_burst
, 16);
97 HANTRO_PP_REG_WRITE(vpu
, out_luma_base
, dst_dma
);
98 HANTRO_PP_REG_WRITE(vpu
, input_width
, MB_WIDTH(ctx
->dst_fmt
.width
));
99 HANTRO_PP_REG_WRITE(vpu
, input_height
, MB_HEIGHT(ctx
->dst_fmt
.height
));
100 HANTRO_PP_REG_WRITE(vpu
, input_fmt
, src_pp_fmt
);
101 HANTRO_PP_REG_WRITE(vpu
, output_fmt
, dst_pp_fmt
);
102 HANTRO_PP_REG_WRITE(vpu
, output_width
, ctx
->dst_fmt
.width
);
103 HANTRO_PP_REG_WRITE(vpu
, output_height
, ctx
->dst_fmt
.height
);
104 HANTRO_PP_REG_WRITE(vpu
, orig_width
, MB_WIDTH(ctx
->dst_fmt
.width
));
105 HANTRO_PP_REG_WRITE(vpu
, display_width
, ctx
->dst_fmt
.width
);
108 static int down_scale_factor(struct hantro_ctx
*ctx
)
110 if (ctx
->src_fmt
.width
<= ctx
->dst_fmt
.width
)
113 return DIV_ROUND_CLOSEST(ctx
->src_fmt
.width
, ctx
->dst_fmt
.width
);
116 static void hantro_postproc_g2_enable(struct hantro_ctx
*ctx
)
118 struct hantro_dev
*vpu
= ctx
->dev
;
119 struct vb2_v4l2_buffer
*dst_buf
;
120 int down_scale
= down_scale_factor(ctx
);
122 size_t chroma_offset
;
125 dst_buf
= hantro_get_dst_buf(ctx
);
126 dst_dma
= vb2_dma_contig_plane_dma_addr(&dst_buf
->vb2_buf
, 0);
127 chroma_offset
= ctx
->dst_fmt
.plane_fmt
[0].bytesperline
*
131 hantro_reg_write(vpu
, &g2_down_scale_e
, 1);
132 hantro_reg_write(vpu
, &g2_down_scale_y
, down_scale
>> 2);
133 hantro_reg_write(vpu
, &g2_down_scale_x
, down_scale
>> 2);
134 hantro_write_addr(vpu
, G2_DS_DST
, dst_dma
);
135 hantro_write_addr(vpu
, G2_DS_DST_CHR
, dst_dma
+ (chroma_offset
>> down_scale
));
137 hantro_write_addr(vpu
, G2_RS_OUT_LUMA_ADDR
, dst_dma
);
138 hantro_write_addr(vpu
, G2_RS_OUT_CHROMA_ADDR
, dst_dma
+ chroma_offset
);
141 out_depth
= hantro_get_format_depth(ctx
->dst_fmt
.pixelformat
);
142 if (ctx
->dev
->variant
->legacy_regs
) {
146 pp_shift
= 16 - out_depth
;
148 hantro_reg_write(ctx
->dev
, &g2_rs_out_bit_depth
, out_depth
);
149 hantro_reg_write(ctx
->dev
, &g2_pp_pix_shift
, pp_shift
);
151 hantro_reg_write(vpu
, &g2_output_8_bits
, out_depth
> 8 ? 0 : 1);
152 hantro_reg_write(vpu
, &g2_output_format
, out_depth
> 8 ? 1 : 0);
154 hantro_reg_write(vpu
, &g2_out_rs_e
, 1);
157 static int hantro_postproc_g2_enum_framesizes(struct hantro_ctx
*ctx
,
158 struct v4l2_frmsizeenum
*fsize
)
161 * G2 scaler can scale down by 0, 2, 4 or 8
162 * use fsize->index has power of 2 diviser
164 if (fsize
->index
> 3)
167 if (!ctx
->src_fmt
.width
|| !ctx
->src_fmt
.height
)
170 fsize
->type
= V4L2_FRMSIZE_TYPE_DISCRETE
;
171 fsize
->discrete
.width
= ctx
->src_fmt
.width
>> fsize
->index
;
172 fsize
->discrete
.height
= ctx
->src_fmt
.height
>> fsize
->index
;
177 void hantro_postproc_free(struct hantro_ctx
*ctx
)
179 struct hantro_dev
*vpu
= ctx
->dev
;
180 struct v4l2_m2m_ctx
*m2m_ctx
= ctx
->fh
.m2m_ctx
;
181 struct vb2_queue
*queue
= &m2m_ctx
->cap_q_ctx
.q
;
184 for (i
= 0; i
< queue
->max_num_buffers
; ++i
) {
185 struct hantro_aux_buf
*priv
= &ctx
->postproc
.dec_q
[i
];
188 dma_free_attrs(vpu
->dev
, priv
->size
, priv
->cpu
,
189 priv
->dma
, priv
->attrs
);
195 static unsigned int hantro_postproc_buffer_size(struct hantro_ctx
*ctx
)
197 unsigned int buf_size
;
199 buf_size
= ctx
->ref_fmt
.plane_fmt
[0].sizeimage
;
200 if (ctx
->vpu_src_fmt
->fourcc
== V4L2_PIX_FMT_H264_SLICE
)
201 buf_size
+= hantro_h264_mv_size(ctx
->ref_fmt
.width
,
202 ctx
->ref_fmt
.height
);
203 else if (ctx
->vpu_src_fmt
->fourcc
== V4L2_PIX_FMT_VP9_FRAME
)
204 buf_size
+= hantro_vp9_mv_size(ctx
->ref_fmt
.width
,
205 ctx
->ref_fmt
.height
);
206 else if (ctx
->vpu_src_fmt
->fourcc
== V4L2_PIX_FMT_HEVC_SLICE
) {
207 buf_size
+= hantro_hevc_mv_size(ctx
->ref_fmt
.width
,
208 ctx
->ref_fmt
.height
);
209 if (ctx
->hevc_dec
.use_compression
)
210 buf_size
+= hantro_hevc_compressed_size(ctx
->ref_fmt
.width
,
211 ctx
->ref_fmt
.height
);
213 else if (ctx
->vpu_src_fmt
->fourcc
== V4L2_PIX_FMT_AV1_FRAME
)
214 buf_size
+= hantro_av1_mv_size(ctx
->ref_fmt
.width
,
215 ctx
->ref_fmt
.height
);
220 static int hantro_postproc_alloc(struct hantro_ctx
*ctx
, int index
)
222 struct hantro_dev
*vpu
= ctx
->dev
;
223 struct hantro_aux_buf
*priv
= &ctx
->postproc
.dec_q
[index
];
224 unsigned int buf_size
= hantro_postproc_buffer_size(ctx
);
230 * The buffers on this queue are meant as intermediate
231 * buffers for the decoder, so no mapping is needed.
233 priv
->attrs
= DMA_ATTR_NO_KERNEL_MAPPING
;
234 priv
->cpu
= dma_alloc_attrs(vpu
->dev
, buf_size
, &priv
->dma
,
235 GFP_KERNEL
, priv
->attrs
);
238 priv
->size
= buf_size
;
243 int hantro_postproc_init(struct hantro_ctx
*ctx
)
245 struct v4l2_m2m_ctx
*m2m_ctx
= ctx
->fh
.m2m_ctx
;
246 struct vb2_queue
*cap_queue
= &m2m_ctx
->cap_q_ctx
.q
;
247 unsigned int num_buffers
= vb2_get_num_buffers(cap_queue
);
251 for (i
= 0; i
< num_buffers
; i
++) {
252 ret
= hantro_postproc_alloc(ctx
, i
);
261 hantro_postproc_get_dec_buf_addr(struct hantro_ctx
*ctx
, int index
)
263 struct hantro_aux_buf
*priv
= &ctx
->postproc
.dec_q
[index
];
264 unsigned int buf_size
= hantro_postproc_buffer_size(ctx
);
265 struct hantro_dev
*vpu
= ctx
->dev
;
268 if (priv
->size
< buf_size
&& priv
->cpu
) {
269 /* buffer is too small, release it */
270 dma_free_attrs(vpu
->dev
, priv
->size
, priv
->cpu
,
271 priv
->dma
, priv
->attrs
);
276 /* buffer not already allocated, try getting a new one */
277 ret
= hantro_postproc_alloc(ctx
, index
);
288 static void hantro_postproc_g1_disable(struct hantro_ctx
*ctx
)
290 struct hantro_dev
*vpu
= ctx
->dev
;
292 HANTRO_PP_REG_WRITE(vpu
, pipeline_en
, 0x0);
295 static void hantro_postproc_g2_disable(struct hantro_ctx
*ctx
)
297 struct hantro_dev
*vpu
= ctx
->dev
;
299 hantro_reg_write(vpu
, &g2_out_rs_e
, 0);
302 void hantro_postproc_disable(struct hantro_ctx
*ctx
)
304 struct hantro_dev
*vpu
= ctx
->dev
;
306 if (vpu
->variant
->postproc_ops
&& vpu
->variant
->postproc_ops
->disable
)
307 vpu
->variant
->postproc_ops
->disable(ctx
);
310 void hantro_postproc_enable(struct hantro_ctx
*ctx
)
312 struct hantro_dev
*vpu
= ctx
->dev
;
314 if (vpu
->variant
->postproc_ops
&& vpu
->variant
->postproc_ops
->enable
)
315 vpu
->variant
->postproc_ops
->enable(ctx
);
318 int hanto_postproc_enum_framesizes(struct hantro_ctx
*ctx
,
319 struct v4l2_frmsizeenum
*fsize
)
321 struct hantro_dev
*vpu
= ctx
->dev
;
323 if (vpu
->variant
->postproc_ops
&& vpu
->variant
->postproc_ops
->enum_framesizes
)
324 return vpu
->variant
->postproc_ops
->enum_framesizes(ctx
, fsize
);
329 const struct hantro_postproc_ops hantro_g1_postproc_ops
= {
330 .enable
= hantro_postproc_g1_enable
,
331 .disable
= hantro_postproc_g1_disable
,
334 const struct hantro_postproc_ops hantro_g2_postproc_ops
= {
335 .enable
= hantro_postproc_g2_enable
,
336 .disable
= hantro_postproc_g2_disable
,
337 .enum_framesizes
= hantro_postproc_g2_enum_framesizes
,