| // SPDX-License-Identifier: GPL-2.0+ |
| /* |
| * Copyright (C) 2018 BayLibre, SAS |
| * Author: Maxime Jourdan <mjourdan@baylibre.com> |
| * |
| * The Elementary Stream Parser is a HW bitstream parser. |
| * It reads bitstream buffers and feeds them to the VIFIFO |
| */ |
| |
| #include <linux/init.h> |
| #include <linux/ioctl.h> |
| #include <linux/list.h> |
| #include <linux/module.h> |
| #include <linux/of_device.h> |
| #include <linux/reset.h> |
| #include <linux/interrupt.h> |
| #include <media/videobuf2-dma-contig.h> |
| #include <media/v4l2-mem2mem.h> |
| |
| #include "dos_regs.h" |
| #include "esparser.h" |
| #include "vdec_helpers.h" |
| |
| /* PARSER REGS (CBUS) */ |
| #define PARSER_CONTROL 0x00 |
| #define ES_PACK_SIZE_BIT 8 |
| #define ES_WRITE BIT(5) |
| #define ES_SEARCH BIT(1) |
| #define ES_PARSER_START BIT(0) |
| #define PARSER_FETCH_ADDR 0x4 |
| #define PARSER_FETCH_CMD 0x8 |
| #define PARSER_CONFIG 0x14 |
| #define PS_CFG_MAX_FETCH_CYCLE_BIT 0 |
| #define PS_CFG_STARTCODE_WID_24_BIT 10 |
| #define PS_CFG_MAX_ES_WR_CYCLE_BIT 12 |
| #define PS_CFG_PFIFO_EMPTY_CNT_BIT 16 |
| #define PFIFO_WR_PTR 0x18 |
| #define PFIFO_RD_PTR 0x1c |
| #define PARSER_SEARCH_PATTERN 0x24 |
| #define ES_START_CODE_PATTERN 0x00000100 |
| #define PARSER_SEARCH_MASK 0x28 |
| #define ES_START_CODE_MASK 0xffffff00 |
| #define FETCH_ENDIAN_BIT 27 |
| #define PARSER_INT_ENABLE 0x2c |
| #define PARSER_INT_HOST_EN_BIT 8 |
| #define PARSER_INT_STATUS 0x30 |
| #define PARSER_INTSTAT_SC_FOUND 1 |
| #define PARSER_ES_CONTROL 0x5c |
| #define PARSER_VIDEO_START_PTR 0x80 |
| #define PARSER_VIDEO_END_PTR 0x84 |
| #define PARSER_VIDEO_WP 0x88 |
| #define PARSER_VIDEO_HOLE 0x90 |
| |
| #define SEARCH_PATTERN_LEN 512 |
| #define VP9_HEADER_SIZE 16 |
| |
| static DECLARE_WAIT_QUEUE_HEAD(wq); |
| static int search_done; |
| |
| static irqreturn_t esparser_isr(int irq, void *dev) |
| { |
| int int_status; |
| struct amvdec_core *core = dev; |
| |
| int_status = amvdec_read_parser(core, PARSER_INT_STATUS); |
| amvdec_write_parser(core, PARSER_INT_STATUS, int_status); |
| |
| if (int_status & PARSER_INTSTAT_SC_FOUND) { |
| amvdec_write_parser(core, PFIFO_RD_PTR, 0); |
| amvdec_write_parser(core, PFIFO_WR_PTR, 0); |
| search_done = 1; |
| wake_up_interruptible(&wq); |
| } |
| |
| return IRQ_HANDLED; |
| } |
| |
| /* |
| * VP9 frame headers need to be appended by a 16-byte long |
| * Amlogic custom header |
| */ |
| static int vp9_update_header(struct amvdec_core *core, struct vb2_buffer *buf) |
| { |
| u8 *dp; |
| u8 marker; |
| int dsize; |
| int num_frames, cur_frame; |
| int cur_mag, mag, mag_ptr; |
| int frame_size[8], tot_frame_size[8]; |
| int total_datasize = 0; |
| int new_frame_size; |
| unsigned char *old_header = NULL; |
| |
| dp = (uint8_t *)vb2_plane_vaddr(buf, 0); |
| dsize = vb2_get_plane_payload(buf, 0); |
| |
| if (dsize == vb2_plane_size(buf, 0)) { |
| dev_warn(core->dev, "%s: unable to update header\n", __func__); |
| return 0; |
| } |
| |
| marker = dp[dsize - 1]; |
| if ((marker & 0xe0) == 0xc0) { |
| num_frames = (marker & 0x7) + 1; |
| mag = ((marker >> 3) & 0x3) + 1; |
| mag_ptr = dsize - mag * num_frames - 2; |
| if (dp[mag_ptr] != marker) |
| return 0; |
| |
| mag_ptr++; |
| for (cur_frame = 0; cur_frame < num_frames; cur_frame++) { |
| frame_size[cur_frame] = 0; |
| for (cur_mag = 0; cur_mag < mag; cur_mag++) { |
| frame_size[cur_frame] |= |
| (dp[mag_ptr] << (cur_mag * 8)); |
| mag_ptr++; |
| } |
| if (cur_frame == 0) |
| tot_frame_size[cur_frame] = |
| frame_size[cur_frame]; |
| else |
| tot_frame_size[cur_frame] = |
| tot_frame_size[cur_frame - 1] + |
| frame_size[cur_frame]; |
| total_datasize += frame_size[cur_frame]; |
| } |
| } else { |
| num_frames = 1; |
| frame_size[0] = dsize; |
| tot_frame_size[0] = dsize; |
| total_datasize = dsize; |
| } |
| |
| new_frame_size = total_datasize + num_frames * VP9_HEADER_SIZE; |
| |
| if (new_frame_size >= vb2_plane_size(buf, 0)) { |
| dev_warn(core->dev, "%s: unable to update header\n", __func__); |
| return 0; |
| } |
| |
| for (cur_frame = num_frames - 1; cur_frame >= 0; cur_frame--) { |
| int framesize = frame_size[cur_frame]; |
| int framesize_header = framesize + 4; |
| int oldframeoff = tot_frame_size[cur_frame] - framesize; |
| int outheaderoff = oldframeoff + cur_frame * VP9_HEADER_SIZE; |
| u8 *fdata = dp + outheaderoff; |
| u8 *old_framedata = dp + oldframeoff; |
| |
| memmove(fdata + VP9_HEADER_SIZE, old_framedata, framesize); |
| |
| fdata[0] = (framesize_header >> 24) & 0xff; |
| fdata[1] = (framesize_header >> 16) & 0xff; |
| fdata[2] = (framesize_header >> 8) & 0xff; |
| fdata[3] = (framesize_header >> 0) & 0xff; |
| fdata[4] = ((framesize_header >> 24) & 0xff) ^ 0xff; |
| fdata[5] = ((framesize_header >> 16) & 0xff) ^ 0xff; |
| fdata[6] = ((framesize_header >> 8) & 0xff) ^ 0xff; |
| fdata[7] = ((framesize_header >> 0) & 0xff) ^ 0xff; |
| fdata[8] = 0; |
| fdata[9] = 0; |
| fdata[10] = 0; |
| fdata[11] = 1; |
| fdata[12] = 'A'; |
| fdata[13] = 'M'; |
| fdata[14] = 'L'; |
| fdata[15] = 'V'; |
| |
| if (!old_header) { |
| /* nothing */ |
| } else if (old_header > fdata + 16 + framesize) { |
| dev_dbg(core->dev, "%s: data has gaps, setting to 0\n", |
| __func__); |
| memset(fdata + 16 + framesize, 0, |
| (old_header - fdata + 16 + framesize)); |
| } else if (old_header < fdata + 16 + framesize) { |
| dev_err(core->dev, "%s: data overwritten\n", __func__); |
| } |
| old_header = fdata; |
| } |
| |
| return new_frame_size; |
| } |
| |
| /* Pad the packet to at least 4KiB bytes otherwise the VDEC unit won't trigger |
| * ISRs. |
| * Also append a start code 000001ff at the end to trigger |
| * the ESPARSER interrupt. |
| */ |
| static u32 esparser_pad_start_code(struct amvdec_core *core, |
| struct vb2_buffer *vb, |
| u32 payload_size) |
| { |
| u32 pad_size = 0; |
| u8 *vaddr = vb2_plane_vaddr(vb, 0); |
| |
| if (payload_size < ESPARSER_MIN_PACKET_SIZE) { |
| pad_size = ESPARSER_MIN_PACKET_SIZE - payload_size; |
| memset(vaddr + payload_size, 0, pad_size); |
| } |
| |
| if ((payload_size + pad_size + SEARCH_PATTERN_LEN) > |
| vb2_plane_size(vb, 0)) { |
| dev_warn(core->dev, "%s: unable to pad start code\n", __func__); |
| return pad_size; |
| } |
| |
| memset(vaddr + payload_size + pad_size, 0, SEARCH_PATTERN_LEN); |
| vaddr[payload_size + pad_size] = 0x00; |
| vaddr[payload_size + pad_size + 1] = 0x00; |
| vaddr[payload_size + pad_size + 2] = 0x01; |
| vaddr[payload_size + pad_size + 3] = 0xff; |
| |
| return pad_size; |
| } |
| |
| static int |
| esparser_write_data(struct amvdec_core *core, dma_addr_t addr, u32 size) |
| { |
| amvdec_write_parser(core, PFIFO_RD_PTR, 0); |
| amvdec_write_parser(core, PFIFO_WR_PTR, 0); |
| amvdec_write_parser(core, PARSER_CONTROL, |
| ES_WRITE | |
| ES_PARSER_START | |
| ES_SEARCH | |
| (size << ES_PACK_SIZE_BIT)); |
| |
| amvdec_write_parser(core, PARSER_FETCH_ADDR, addr); |
| amvdec_write_parser(core, PARSER_FETCH_CMD, |
| (7 << FETCH_ENDIAN_BIT) | |
| (size + SEARCH_PATTERN_LEN)); |
| |
| search_done = 0; |
| return wait_event_interruptible_timeout(wq, search_done, (HZ / 5)); |
| } |
| |
| static u32 esparser_vififo_get_free_space(struct amvdec_session *sess) |
| { |
| u32 vififo_usage; |
| struct amvdec_ops *vdec_ops = sess->fmt_out->vdec_ops; |
| struct amvdec_core *core = sess->core; |
| |
| vififo_usage = vdec_ops->vififo_level(sess); |
| vififo_usage += amvdec_read_parser(core, PARSER_VIDEO_HOLE); |
| vififo_usage += (6 * SZ_1K); // 6 KiB internal fifo |
| |
| if (vififo_usage > sess->vififo_size) { |
| dev_warn(sess->core->dev, |
| "VIFIFO usage (%u) > VIFIFO size (%u)\n", |
| vififo_usage, sess->vififo_size); |
| return 0; |
| } |
| |
| return sess->vififo_size - vififo_usage; |
| } |
| |
| int esparser_queue_eos(struct amvdec_core *core, const u8 *data, u32 len) |
| { |
| struct device *dev = core->dev; |
| void *eos_vaddr; |
| dma_addr_t eos_paddr; |
| int ret; |
| |
| eos_vaddr = dma_alloc_coherent(dev, len + SEARCH_PATTERN_LEN, |
| &eos_paddr, GFP_KERNEL); |
| if (!eos_vaddr) |
| return -ENOMEM; |
| |
| memcpy(eos_vaddr, data, len); |
| ret = esparser_write_data(core, eos_paddr, len); |
| dma_free_coherent(dev, len + SEARCH_PATTERN_LEN, |
| eos_vaddr, eos_paddr); |
| |
| return ret; |
| } |
| |
| static u32 esparser_get_offset(struct amvdec_session *sess) |
| { |
| struct amvdec_core *core = sess->core; |
| u32 offset = amvdec_read_parser(core, PARSER_VIDEO_WP) - |
| sess->vififo_paddr; |
| |
| if (offset < sess->last_offset) |
| sess->wrap_count++; |
| |
| sess->last_offset = offset; |
| offset += (sess->wrap_count * sess->vififo_size); |
| |
| return offset; |
| } |
| |
| static int |
| esparser_queue(struct amvdec_session *sess, struct vb2_v4l2_buffer *vbuf) |
| { |
| int ret; |
| struct vb2_buffer *vb = &vbuf->vb2_buf; |
| struct amvdec_core *core = sess->core; |
| struct amvdec_codec_ops *codec_ops = sess->fmt_out->codec_ops; |
| u32 payload_size = vb2_get_plane_payload(vb, 0); |
| dma_addr_t phy = vb2_dma_contig_plane_dma_addr(vb, 0); |
| u32 num_dst_bufs = 0; |
| u32 offset; |
| u32 pad_size; |
| |
| /* |
| * When max ref frame is held by VP9, this should be -= 3 to prevent a |
| * shortage of CAPTURE buffers on the decoder side. |
| * For the future, a good enhancement of the way this is handled could |
| * be to notify new capture buffers to the decoding modules, so that |
| * they could pause when there is no capture buffer available and |
| * resume on this notification. |
| */ |
| if (sess->fmt_out->pixfmt == V4L2_PIX_FMT_VP9) { |
| if (codec_ops->num_pending_bufs) |
| num_dst_bufs = codec_ops->num_pending_bufs(sess); |
| |
| num_dst_bufs += v4l2_m2m_num_dst_bufs_ready(sess->m2m_ctx); |
| if (sess->fmt_out->pixfmt == V4L2_PIX_FMT_VP9) |
| num_dst_bufs -= 3; |
| |
| if (esparser_vififo_get_free_space(sess) < payload_size || |
| atomic_read(&sess->esparser_queued_bufs) >= num_dst_bufs) |
| return -EAGAIN; |
| } else if (esparser_vififo_get_free_space(sess) < payload_size) { |
| return -EAGAIN; |
| } |
| |
| v4l2_m2m_src_buf_remove_by_buf(sess->m2m_ctx, vbuf); |
| |
| offset = esparser_get_offset(sess); |
| |
| amvdec_add_ts(sess, vb->timestamp, vbuf->timecode, offset, vbuf->flags); |
| dev_dbg(core->dev, "esparser: ts = %llu pld_size = %u offset = %08X flags = %08X\n", |
| vb->timestamp, payload_size, offset, vbuf->flags); |
| |
| vbuf->flags = 0; |
| vbuf->field = V4L2_FIELD_NONE; |
| vbuf->sequence = sess->sequence_out++; |
| |
| if (sess->fmt_out->pixfmt == V4L2_PIX_FMT_VP9) { |
| payload_size = vp9_update_header(core, vb); |
| |
| /* If unable to alter buffer to add headers */ |
| if (payload_size == 0) { |
| amvdec_remove_ts(sess, vb->timestamp); |
| v4l2_m2m_buf_done(vbuf, VB2_BUF_STATE_ERROR); |
| |
| return 0; |
| } |
| } |
| |
| pad_size = esparser_pad_start_code(core, vb, payload_size); |
| ret = esparser_write_data(core, phy, payload_size + pad_size); |
| |
| if (ret <= 0) { |
| dev_warn(core->dev, "esparser: input parsing error\n"); |
| amvdec_remove_ts(sess, vb->timestamp); |
| v4l2_m2m_buf_done(vbuf, VB2_BUF_STATE_ERROR); |
| amvdec_write_parser(core, PARSER_FETCH_CMD, 0); |
| |
| return 0; |
| } |
| |
| atomic_inc(&sess->esparser_queued_bufs); |
| v4l2_m2m_buf_done(vbuf, VB2_BUF_STATE_DONE); |
| |
| return 0; |
| } |
| |
| void esparser_queue_all_src(struct work_struct *work) |
| { |
| struct v4l2_m2m_buffer *buf, *n; |
| struct amvdec_session *sess = |
| container_of(work, struct amvdec_session, esparser_queue_work); |
| |
| mutex_lock(&sess->lock); |
| v4l2_m2m_for_each_src_buf_safe(sess->m2m_ctx, buf, n) { |
| if (sess->should_stop) |
| break; |
| |
| if (esparser_queue(sess, &buf->vb) < 0) |
| break; |
| } |
| mutex_unlock(&sess->lock); |
| } |
| |
| int esparser_power_up(struct amvdec_session *sess) |
| { |
| struct amvdec_core *core = sess->core; |
| struct amvdec_ops *vdec_ops = sess->fmt_out->vdec_ops; |
| |
| reset_control_reset(core->esparser_reset); |
| amvdec_write_parser(core, PARSER_CONFIG, |
| (10 << PS_CFG_PFIFO_EMPTY_CNT_BIT) | |
| (1 << PS_CFG_MAX_ES_WR_CYCLE_BIT) | |
| (16 << PS_CFG_MAX_FETCH_CYCLE_BIT)); |
| |
| amvdec_write_parser(core, PFIFO_RD_PTR, 0); |
| amvdec_write_parser(core, PFIFO_WR_PTR, 0); |
| |
| amvdec_write_parser(core, PARSER_SEARCH_PATTERN, |
| ES_START_CODE_PATTERN); |
| amvdec_write_parser(core, PARSER_SEARCH_MASK, ES_START_CODE_MASK); |
| |
| amvdec_write_parser(core, PARSER_CONFIG, |
| (10 << PS_CFG_PFIFO_EMPTY_CNT_BIT) | |
| (1 << PS_CFG_MAX_ES_WR_CYCLE_BIT) | |
| (16 << PS_CFG_MAX_FETCH_CYCLE_BIT) | |
| (2 << PS_CFG_STARTCODE_WID_24_BIT)); |
| |
| amvdec_write_parser(core, PARSER_CONTROL, |
| (ES_SEARCH | ES_PARSER_START)); |
| |
| amvdec_write_parser(core, PARSER_VIDEO_START_PTR, sess->vififo_paddr); |
| amvdec_write_parser(core, PARSER_VIDEO_END_PTR, |
| sess->vififo_paddr + sess->vififo_size - 8); |
| amvdec_write_parser(core, PARSER_ES_CONTROL, |
| amvdec_read_parser(core, PARSER_ES_CONTROL) & ~1); |
| |
| if (vdec_ops->conf_esparser) |
| vdec_ops->conf_esparser(sess); |
| |
| amvdec_write_parser(core, PARSER_INT_STATUS, 0xffff); |
| amvdec_write_parser(core, PARSER_INT_ENABLE, |
| BIT(PARSER_INT_HOST_EN_BIT)); |
| |
| return 0; |
| } |
| |
| int esparser_init(struct platform_device *pdev, struct amvdec_core *core) |
| { |
| struct device *dev = &pdev->dev; |
| int ret; |
| int irq; |
| |
| irq = platform_get_irq_byname(pdev, "esparser"); |
| if (irq < 0) |
| return irq; |
| |
| ret = devm_request_irq(dev, irq, esparser_isr, IRQF_SHARED, |
| "esparserirq", core); |
| if (ret) { |
| dev_err(dev, "Failed requesting ESPARSER IRQ\n"); |
| return ret; |
| } |
| |
| core->esparser_reset = |
| devm_reset_control_get_exclusive(dev, "esparser"); |
| if (IS_ERR(core->esparser_reset)) { |
| dev_err(dev, "Failed to get esparser_reset\n"); |
| return PTR_ERR(core->esparser_reset); |
| } |
| |
| return 0; |
| } |