| // SPDX-License-Identifier: GPL-2.0 |
| /* |
| * Hantro VPU codec driver |
| * |
| * Copyright (C) 2018 Rockchip Electronics Co., Ltd. |
| * |
| * JPEG encoder |
| * ------------ |
| * The VPU JPEG encoder produces JPEG baseline sequential format. |
| * The quantization coefficients are 8-bit values, complying with |
| * the baseline specification. Therefore, it requires |
| * luma and chroma quantization tables. The hardware does entropy |
| * encoding using internal Huffman tables, as specified in the JPEG |
| * specification. |
| * |
| * In other words, only the luma and chroma quantization tables are |
| * required for the encoding operation. |
| * |
| * Quantization luma table values are written to registers |
| * VEPU_swreg_0-VEPU_swreg_15, and chroma table values to |
| * VEPU_swreg_16-VEPU_swreg_31. |
| * |
| * JPEG zigzag order is expected on the quantization tables. |
| */ |
| |
| #include <asm/unaligned.h> |
| #include <media/v4l2-mem2mem.h> |
| #include "hantro_jpeg.h" |
| #include "hantro.h" |
| #include "hantro_v4l2.h" |
| #include "hantro_hw.h" |
| #include "rk3399_vpu_regs.h" |
| |
| #define VEPU_JPEG_QUANT_TABLE_COUNT 16 |
| |
| static void rk3399_vpu_set_src_img_ctrl(struct hantro_dev *vpu, |
| struct hantro_ctx *ctx) |
| { |
| struct v4l2_pix_format_mplane *pix_fmt = &ctx->src_fmt; |
| u32 reg; |
| |
| /* |
| * The pix fmt width/height are already macroblock aligned |
| * by .vidioc_s_fmt_vid_cap_mplane() callback |
| */ |
| reg = VEPU_REG_IN_IMG_CTRL_ROW_LEN(pix_fmt->width); |
| vepu_write_relaxed(vpu, reg, VEPU_REG_INPUT_LUMA_INFO); |
| |
| reg = VEPU_REG_IN_IMG_CTRL_OVRFLR_D4(0) | |
| VEPU_REG_IN_IMG_CTRL_OVRFLB(0); |
| /* |
| * This register controls the input crop, as the offset |
| * from the right/bottom within the last macroblock. The offset from the |
| * right must be divided by 4 and so the crop must be aligned to 4 pixels |
| * horizontally. |
| */ |
| vepu_write_relaxed(vpu, reg, VEPU_REG_ENC_OVER_FILL_STRM_OFFSET); |
| |
| reg = VEPU_REG_IN_IMG_CTRL_FMT(ctx->vpu_src_fmt->enc_fmt); |
| vepu_write_relaxed(vpu, reg, VEPU_REG_ENC_CTRL1); |
| } |
| |
| static void rk3399_vpu_jpeg_enc_set_buffers(struct hantro_dev *vpu, |
| struct hantro_ctx *ctx, |
| struct vb2_buffer *src_buf) |
| { |
| struct v4l2_pix_format_mplane *pix_fmt = &ctx->src_fmt; |
| dma_addr_t src[3]; |
| |
| WARN_ON(pix_fmt->num_planes > 3); |
| |
| vepu_write_relaxed(vpu, ctx->jpeg_enc.bounce_buffer.dma, |
| VEPU_REG_ADDR_OUTPUT_STREAM); |
| vepu_write_relaxed(vpu, ctx->jpeg_enc.bounce_buffer.size, |
| VEPU_REG_STR_BUF_LIMIT); |
| |
| if (pix_fmt->num_planes == 1) { |
| src[0] = vb2_dma_contig_plane_dma_addr(src_buf, 0); |
| vepu_write_relaxed(vpu, src[0], VEPU_REG_ADDR_IN_PLANE_0); |
| } else if (pix_fmt->num_planes == 2) { |
| src[0] = vb2_dma_contig_plane_dma_addr(src_buf, 0); |
| src[1] = vb2_dma_contig_plane_dma_addr(src_buf, 1); |
| vepu_write_relaxed(vpu, src[0], VEPU_REG_ADDR_IN_PLANE_0); |
| vepu_write_relaxed(vpu, src[1], VEPU_REG_ADDR_IN_PLANE_1); |
| } else { |
| src[0] = vb2_dma_contig_plane_dma_addr(src_buf, 0); |
| src[1] = vb2_dma_contig_plane_dma_addr(src_buf, 1); |
| src[2] = vb2_dma_contig_plane_dma_addr(src_buf, 2); |
| vepu_write_relaxed(vpu, src[0], VEPU_REG_ADDR_IN_PLANE_0); |
| vepu_write_relaxed(vpu, src[1], VEPU_REG_ADDR_IN_PLANE_1); |
| vepu_write_relaxed(vpu, src[2], VEPU_REG_ADDR_IN_PLANE_2); |
| } |
| } |
| |
| static void |
| rk3399_vpu_jpeg_enc_set_qtable(struct hantro_dev *vpu, |
| unsigned char *luma_qtable, |
| unsigned char *chroma_qtable) |
| { |
| u32 reg, i; |
| |
| for (i = 0; i < VEPU_JPEG_QUANT_TABLE_COUNT; i++) { |
| reg = get_unaligned_be32(&luma_qtable[i]); |
| vepu_write_relaxed(vpu, reg, VEPU_REG_JPEG_LUMA_QUAT(i)); |
| |
| reg = get_unaligned_be32(&chroma_qtable[i]); |
| vepu_write_relaxed(vpu, reg, VEPU_REG_JPEG_CHROMA_QUAT(i)); |
| } |
| } |
| |
| void rk3399_vpu_jpeg_enc_run(struct hantro_ctx *ctx) |
| { |
| struct hantro_dev *vpu = ctx->dev; |
| struct vb2_v4l2_buffer *src_buf, *dst_buf; |
| struct hantro_jpeg_ctx jpeg_ctx; |
| u32 reg; |
| |
| src_buf = hantro_get_src_buf(ctx); |
| dst_buf = hantro_get_dst_buf(ctx); |
| |
| hantro_start_prepare_run(ctx); |
| |
| memset(&jpeg_ctx, 0, sizeof(jpeg_ctx)); |
| jpeg_ctx.buffer = vb2_plane_vaddr(&dst_buf->vb2_buf, 0); |
| jpeg_ctx.width = ctx->dst_fmt.width; |
| jpeg_ctx.height = ctx->dst_fmt.height; |
| jpeg_ctx.quality = ctx->jpeg_quality; |
| hantro_jpeg_header_assemble(&jpeg_ctx); |
| |
| /* Switch to JPEG encoder mode before writing registers */ |
| vepu_write_relaxed(vpu, VEPU_REG_ENCODE_FORMAT_JPEG, |
| VEPU_REG_ENCODE_START); |
| |
| rk3399_vpu_set_src_img_ctrl(vpu, ctx); |
| rk3399_vpu_jpeg_enc_set_buffers(vpu, ctx, &src_buf->vb2_buf); |
| rk3399_vpu_jpeg_enc_set_qtable(vpu, |
| hantro_jpeg_get_qtable(&jpeg_ctx, 0), |
| hantro_jpeg_get_qtable(&jpeg_ctx, 1)); |
| |
| reg = VEPU_REG_OUTPUT_SWAP32 |
| | VEPU_REG_OUTPUT_SWAP16 |
| | VEPU_REG_OUTPUT_SWAP8 |
| | VEPU_REG_INPUT_SWAP8 |
| | VEPU_REG_INPUT_SWAP16 |
| | VEPU_REG_INPUT_SWAP32; |
| /* Make sure that all registers are written at this point. */ |
| vepu_write(vpu, reg, VEPU_REG_DATA_ENDIAN); |
| |
| reg = VEPU_REG_AXI_CTRL_BURST_LEN(16); |
| vepu_write_relaxed(vpu, reg, VEPU_REG_AXI_CTRL); |
| |
| reg = VEPU_REG_MB_WIDTH(MB_WIDTH(ctx->src_fmt.width)) |
| | VEPU_REG_MB_HEIGHT(MB_HEIGHT(ctx->src_fmt.height)) |
| | VEPU_REG_FRAME_TYPE_INTRA |
| | VEPU_REG_ENCODE_FORMAT_JPEG |
| | VEPU_REG_ENCODE_ENABLE; |
| |
| /* Kick the watchdog and start encoding */ |
| hantro_end_prepare_run(ctx); |
| vepu_write(vpu, reg, VEPU_REG_ENCODE_START); |
| } |