| // SPDX-License-Identifier: GPL-2.0-or-later |
| /* |
| * Coda multi-standard codec IP - JPEG support functions |
| * |
| * Copyright (C) 2014 Philipp Zabel, Pengutronix |
| */ |
| |
| #include <asm/unaligned.h> |
| #include <linux/irqreturn.h> |
| #include <linux/kernel.h> |
| #include <linux/ktime.h> |
| #include <linux/slab.h> |
| #include <linux/swab.h> |
| #include <linux/videodev2.h> |
| |
| #include <media/v4l2-common.h> |
| #include <media/v4l2-fh.h> |
| #include <media/v4l2-jpeg.h> |
| #include <media/v4l2-mem2mem.h> |
| #include <media/videobuf2-core.h> |
| #include <media/videobuf2-dma-contig.h> |
| |
| #include "coda.h" |
| #include "trace.h" |
| |
| #define SOI_MARKER 0xffd8 |
| #define APP9_MARKER 0xffe9 |
| #define DRI_MARKER 0xffdd |
| #define DQT_MARKER 0xffdb |
| #define DHT_MARKER 0xffc4 |
| #define SOF_MARKER 0xffc0 |
| #define SOS_MARKER 0xffda |
| #define EOI_MARKER 0xffd9 |
| |
| enum { |
| CODA9_JPEG_FORMAT_420, |
| CODA9_JPEG_FORMAT_422, |
| CODA9_JPEG_FORMAT_224, |
| CODA9_JPEG_FORMAT_444, |
| CODA9_JPEG_FORMAT_400, |
| }; |
| |
| struct coda_huff_tab { |
| u8 luma_dc[16 + 12]; |
| u8 chroma_dc[16 + 12]; |
| u8 luma_ac[16 + 162]; |
| u8 chroma_ac[16 + 162]; |
| |
| /* DC Luma, DC Chroma, AC Luma, AC Chroma */ |
| s16 min[4 * 16]; |
| s16 max[4 * 16]; |
| s8 ptr[4 * 16]; |
| }; |
| |
| #define CODA9_JPEG_ENC_HUFF_DATA_SIZE (256 + 256 + 16 + 16) |
| |
| /* |
| * Typical Huffman tables for 8-bit precision luminance and |
| * chrominance from JPEG ITU-T.81 (ISO/IEC 10918-1) Annex K.3 |
| */ |
| |
| static const unsigned char luma_dc[16 + 12] = { |
| /* bits */ |
| 0x00, 0x01, 0x05, 0x01, 0x01, 0x01, 0x01, 0x01, |
| 0x01, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, |
| /* values */ |
| 0x00, 0x01, 0x02, 0x03, 0x04, 0x05, 0x06, 0x07, |
| 0x08, 0x09, 0x0a, 0x0b, |
| }; |
| |
| static const unsigned char chroma_dc[16 + 12] = { |
| /* bits */ |
| 0x00, 0x03, 0x01, 0x01, 0x01, 0x01, 0x01, 0x01, |
| 0x01, 0x01, 0x01, 0x00, 0x00, 0x00, 0x00, 0x00, |
| /* values */ |
| 0x00, 0x01, 0x02, 0x03, 0x04, 0x05, 0x06, 0x07, |
| 0x08, 0x09, 0x0a, 0x0b, |
| }; |
| |
| static const unsigned char luma_ac[16 + 162 + 2] = { |
| /* bits */ |
| 0x00, 0x02, 0x01, 0x03, 0x03, 0x02, 0x04, 0x03, |
| 0x05, 0x05, 0x04, 0x04, 0x00, 0x00, 0x01, 0x7d, |
| /* values */ |
| 0x01, 0x02, 0x03, 0x00, 0x04, 0x11, 0x05, 0x12, |
| 0x21, 0x31, 0x41, 0x06, 0x13, 0x51, 0x61, 0x07, |
| 0x22, 0x71, 0x14, 0x32, 0x81, 0x91, 0xa1, 0x08, |
| 0x23, 0x42, 0xb1, 0xc1, 0x15, 0x52, 0xd1, 0xf0, |
| 0x24, 0x33, 0x62, 0x72, 0x82, 0x09, 0x0a, 0x16, |
| 0x17, 0x18, 0x19, 0x1a, 0x25, 0x26, 0x27, 0x28, |
| 0x29, 0x2a, 0x34, 0x35, 0x36, 0x37, 0x38, 0x39, |
| 0x3a, 0x43, 0x44, 0x45, 0x46, 0x47, 0x48, 0x49, |
| 0x4a, 0x53, 0x54, 0x55, 0x56, 0x57, 0x58, 0x59, |
| 0x5a, 0x63, 0x64, 0x65, 0x66, 0x67, 0x68, 0x69, |
| 0x6a, 0x73, 0x74, 0x75, 0x76, 0x77, 0x78, 0x79, |
| 0x7a, 0x83, 0x84, 0x85, 0x86, 0x87, 0x88, 0x89, |
| 0x8a, 0x92, 0x93, 0x94, 0x95, 0x96, 0x97, 0x98, |
| 0x99, 0x9a, 0xa2, 0xa3, 0xa4, 0xa5, 0xa6, 0xa7, |
| 0xa8, 0xa9, 0xaa, 0xb2, 0xb3, 0xb4, 0xb5, 0xb6, |
| 0xb7, 0xb8, 0xb9, 0xba, 0xc2, 0xc3, 0xc4, 0xc5, |
| 0xc6, 0xc7, 0xc8, 0xc9, 0xca, 0xd2, 0xd3, 0xd4, |
| 0xd5, 0xd6, 0xd7, 0xd8, 0xd9, 0xda, 0xe1, 0xe2, |
| 0xe3, 0xe4, 0xe5, 0xe6, 0xe7, 0xe8, 0xe9, 0xea, |
| 0xf1, 0xf2, 0xf3, 0xf4, 0xf5, 0xf6, 0xf7, 0xf8, |
| 0xf9, 0xfa, /* padded to 32-bit */ |
| }; |
| |
| static const unsigned char chroma_ac[16 + 162 + 2] = { |
| /* bits */ |
| 0x00, 0x02, 0x01, 0x02, 0x04, 0x04, 0x03, 0x04, |
| 0x07, 0x05, 0x04, 0x04, 0x00, 0x01, 0x02, 0x77, |
| /* values */ |
| 0x00, 0x01, 0x02, 0x03, 0x11, 0x04, 0x05, 0x21, |
| 0x31, 0x06, 0x12, 0x41, 0x51, 0x07, 0x61, 0x71, |
| 0x13, 0x22, 0x32, 0x81, 0x08, 0x14, 0x42, 0x91, |
| 0xa1, 0xb1, 0xc1, 0x09, 0x23, 0x33, 0x52, 0xf0, |
| 0x15, 0x62, 0x72, 0xd1, 0x0a, 0x16, 0x24, 0x34, |
| 0xe1, 0x25, 0xf1, 0x17, 0x18, 0x19, 0x1a, 0x26, |
| 0x27, 0x28, 0x29, 0x2a, 0x35, 0x36, 0x37, 0x38, |
| 0x39, 0x3a, 0x43, 0x44, 0x45, 0x46, 0x47, 0x48, |
| 0x49, 0x4a, 0x53, 0x54, 0x55, 0x56, 0x57, 0x58, |
| 0x59, 0x5a, 0x63, 0x64, 0x65, 0x66, 0x67, 0x68, |
| 0x69, 0x6a, 0x73, 0x74, 0x75, 0x76, 0x77, 0x78, |
| 0x79, 0x7a, 0x82, 0x83, 0x84, 0x85, 0x86, 0x87, |
| 0x88, 0x89, 0x8a, 0x92, 0x93, 0x94, 0x95, 0x96, |
| 0x97, 0x98, 0x99, 0x9a, 0xa2, 0xa3, 0xa4, 0xa5, |
| 0xa6, 0xa7, 0xa8, 0xa9, 0xaa, 0xb2, 0xb3, 0xb4, |
| 0xb5, 0xb6, 0xb7, 0xb8, 0xb9, 0xba, 0xc2, 0xc3, |
| 0xc4, 0xc5, 0xc6, 0xc7, 0xc8, 0xc9, 0xca, 0xd2, |
| 0xd3, 0xd4, 0xd5, 0xd6, 0xd7, 0xd8, 0xd9, 0xda, |
| 0xe2, 0xe3, 0xe4, 0xe5, 0xe6, 0xe7, 0xe8, 0xe9, |
| 0xea, 0xf2, 0xf3, 0xf4, 0xf5, 0xf6, 0xf7, 0xf8, |
| 0xf9, 0xfa, /* padded to 32-bit */ |
| }; |
| |
| /* |
| * Quantization tables for luminance and chrominance components in |
| * zig-zag scan order from the Freescale i.MX VPU libraries |
| */ |
| |
| static unsigned char luma_q[64] = { |
| 0x06, 0x04, 0x04, 0x04, 0x05, 0x04, 0x06, 0x05, |
| 0x05, 0x06, 0x09, 0x06, 0x05, 0x06, 0x09, 0x0b, |
| 0x08, 0x06, 0x06, 0x08, 0x0b, 0x0c, 0x0a, 0x0a, |
| 0x0b, 0x0a, 0x0a, 0x0c, 0x10, 0x0c, 0x0c, 0x0c, |
| 0x0c, 0x0c, 0x0c, 0x10, 0x0c, 0x0c, 0x0c, 0x0c, |
| 0x0c, 0x0c, 0x0c, 0x0c, 0x0c, 0x0c, 0x0c, 0x0c, |
| 0x0c, 0x0c, 0x0c, 0x0c, 0x0c, 0x0c, 0x0c, 0x0c, |
| 0x0c, 0x0c, 0x0c, 0x0c, 0x0c, 0x0c, 0x0c, 0x0c, |
| }; |
| |
| static unsigned char chroma_q[64] = { |
| 0x07, 0x07, 0x07, 0x0d, 0x0c, 0x0d, 0x18, 0x10, |
| 0x10, 0x18, 0x14, 0x0e, 0x0e, 0x0e, 0x14, 0x14, |
| 0x0e, 0x0e, 0x0e, 0x0e, 0x14, 0x11, 0x0c, 0x0c, |
| 0x0c, 0x0c, 0x0c, 0x11, 0x11, 0x0c, 0x0c, 0x0c, |
| 0x0c, 0x0c, 0x0c, 0x11, 0x0c, 0x0c, 0x0c, 0x0c, |
| 0x0c, 0x0c, 0x0c, 0x0c, 0x0c, 0x0c, 0x0c, 0x0c, |
| 0x0c, 0x0c, 0x0c, 0x0c, 0x0c, 0x0c, 0x0c, 0x0c, |
| 0x0c, 0x0c, 0x0c, 0x0c, 0x0c, 0x0c, 0x0c, 0x0c, |
| }; |
| |
| static const unsigned char width_align[] = { |
| [CODA9_JPEG_FORMAT_420] = 16, |
| [CODA9_JPEG_FORMAT_422] = 16, |
| [CODA9_JPEG_FORMAT_224] = 8, |
| [CODA9_JPEG_FORMAT_444] = 8, |
| [CODA9_JPEG_FORMAT_400] = 8, |
| }; |
| |
| static const unsigned char height_align[] = { |
| [CODA9_JPEG_FORMAT_420] = 16, |
| [CODA9_JPEG_FORMAT_422] = 8, |
| [CODA9_JPEG_FORMAT_224] = 16, |
| [CODA9_JPEG_FORMAT_444] = 8, |
| [CODA9_JPEG_FORMAT_400] = 8, |
| }; |
| |
| static int coda9_jpeg_chroma_format(u32 pixfmt) |
| { |
| switch (pixfmt) { |
| case V4L2_PIX_FMT_YUV420: |
| case V4L2_PIX_FMT_NV12: |
| return CODA9_JPEG_FORMAT_420; |
| case V4L2_PIX_FMT_YUV422P: |
| return CODA9_JPEG_FORMAT_422; |
| case V4L2_PIX_FMT_YUV444: |
| return CODA9_JPEG_FORMAT_444; |
| case V4L2_PIX_FMT_GREY: |
| return CODA9_JPEG_FORMAT_400; |
| } |
| return -EINVAL; |
| } |
| |
| struct coda_memcpy_desc { |
| int offset; |
| const void *src; |
| size_t len; |
| }; |
| |
| static void coda_memcpy_parabuf(void *parabuf, |
| const struct coda_memcpy_desc *desc) |
| { |
| u32 *dst = parabuf + desc->offset; |
| const u32 *src = desc->src; |
| int len = desc->len / 4; |
| int i; |
| |
| for (i = 0; i < len; i += 2) { |
| dst[i + 1] = swab32(src[i]); |
| dst[i] = swab32(src[i + 1]); |
| } |
| } |
| |
| int coda_jpeg_write_tables(struct coda_ctx *ctx) |
| { |
| int i; |
| static const struct coda_memcpy_desc huff[8] = { |
| { 0, luma_dc, sizeof(luma_dc) }, |
| { 32, luma_ac, sizeof(luma_ac) }, |
| { 216, chroma_dc, sizeof(chroma_dc) }, |
| { 248, chroma_ac, sizeof(chroma_ac) }, |
| }; |
| struct coda_memcpy_desc qmat[3] = { |
| { 512, ctx->params.jpeg_qmat_tab[0], 64 }, |
| { 576, ctx->params.jpeg_qmat_tab[1], 64 }, |
| { 640, ctx->params.jpeg_qmat_tab[1], 64 }, |
| }; |
| |
| /* Write huffman tables to parameter memory */ |
| for (i = 0; i < ARRAY_SIZE(huff); i++) |
| coda_memcpy_parabuf(ctx->parabuf.vaddr, huff + i); |
| |
| /* Write Q-matrix to parameter memory */ |
| for (i = 0; i < ARRAY_SIZE(qmat); i++) |
| coda_memcpy_parabuf(ctx->parabuf.vaddr, qmat + i); |
| |
| return 0; |
| } |
| |
| bool coda_jpeg_check_buffer(struct coda_ctx *ctx, struct vb2_buffer *vb) |
| { |
| void *vaddr = vb2_plane_vaddr(vb, 0); |
| u16 soi, eoi; |
| int len, i; |
| |
| soi = be16_to_cpup((__be16 *)vaddr); |
| if (soi != SOI_MARKER) |
| return false; |
| |
| len = vb2_get_plane_payload(vb, 0); |
| vaddr += len - 2; |
| for (i = 0; i < 32; i++) { |
| eoi = be16_to_cpup((__be16 *)(vaddr - i)); |
| if (eoi == EOI_MARKER) { |
| if (i > 0) |
| vb2_set_plane_payload(vb, 0, len - i); |
| return true; |
| } |
| } |
| |
| return false; |
| } |
| |
| static int coda9_jpeg_gen_dec_huff_tab(struct coda_ctx *ctx, int tab_num); |
| |
| int coda_jpeg_decode_header(struct coda_ctx *ctx, struct vb2_buffer *vb) |
| { |
| struct coda_dev *dev = ctx->dev; |
| u8 *buf = vb2_plane_vaddr(vb, 0); |
| size_t len = vb2_get_plane_payload(vb, 0); |
| struct v4l2_jpeg_scan_header scan_header; |
| struct v4l2_jpeg_reference quantization_tables[4] = { }; |
| struct v4l2_jpeg_reference huffman_tables[4] = { }; |
| struct v4l2_jpeg_header header = { |
| .scan = &scan_header, |
| .quantization_tables = quantization_tables, |
| .huffman_tables = huffman_tables, |
| }; |
| struct coda_q_data *q_data_src; |
| struct coda_huff_tab *huff_tab; |
| int i, j, ret; |
| |
| ret = v4l2_jpeg_parse_header(buf, len, &header); |
| if (ret < 0) { |
| v4l2_err(&dev->v4l2_dev, "failed to parse JPEG header: %pe\n", |
| ERR_PTR(ret)); |
| return ret; |
| } |
| |
| ctx->params.jpeg_restart_interval = header.restart_interval; |
| |
| /* check frame header */ |
| if (header.frame.height > ctx->codec->max_h || |
| header.frame.width > ctx->codec->max_w) { |
| v4l2_err(&dev->v4l2_dev, "invalid dimensions: %dx%d\n", |
| header.frame.width, header.frame.height); |
| return -EINVAL; |
| } |
| |
| q_data_src = get_q_data(ctx, V4L2_BUF_TYPE_VIDEO_OUTPUT); |
| if (header.frame.height != q_data_src->height || |
| header.frame.width != q_data_src->width) { |
| v4l2_err(&dev->v4l2_dev, |
| "dimensions don't match format: %dx%d\n", |
| header.frame.width, header.frame.height); |
| return -EINVAL; |
| } |
| |
| if (header.frame.num_components != 3) { |
| v4l2_err(&dev->v4l2_dev, |
| "unsupported number of components: %d\n", |
| header.frame.num_components); |
| return -EINVAL; |
| } |
| |
| /* install quantization tables */ |
| if (quantization_tables[3].start) { |
| v4l2_err(&dev->v4l2_dev, |
| "only 3 quantization tables supported\n"); |
| return -EINVAL; |
| } |
| for (i = 0; i < 3; i++) { |
| if (!quantization_tables[i].start) |
| continue; |
| if (quantization_tables[i].length != 64) { |
| v4l2_err(&dev->v4l2_dev, |
| "only 8-bit quantization tables supported\n"); |
| continue; |
| } |
| if (!ctx->params.jpeg_qmat_tab[i]) { |
| ctx->params.jpeg_qmat_tab[i] = kmalloc(64, GFP_KERNEL); |
| if (!ctx->params.jpeg_qmat_tab[i]) |
| return -ENOMEM; |
| } |
| memcpy(ctx->params.jpeg_qmat_tab[i], |
| quantization_tables[i].start, 64); |
| } |
| |
| /* install Huffman tables */ |
| for (i = 0; i < 4; i++) { |
| if (!huffman_tables[i].start) { |
| v4l2_err(&dev->v4l2_dev, "missing Huffman table\n"); |
| return -EINVAL; |
| } |
| /* AC tables should be between 17 -> 178, DC between 17 -> 28 */ |
| if (huffman_tables[i].length < 17 || |
| huffman_tables[i].length > 178 || |
| ((i & 2) == 0 && huffman_tables[i].length > 28)) { |
| v4l2_err(&dev->v4l2_dev, |
| "invalid Huffman table %d length: %zu\n", |
| i, huffman_tables[i].length); |
| return -EINVAL; |
| } |
| } |
| huff_tab = ctx->params.jpeg_huff_tab; |
| if (!huff_tab) { |
| huff_tab = kzalloc(sizeof(struct coda_huff_tab), GFP_KERNEL); |
| if (!huff_tab) |
| return -ENOMEM; |
| ctx->params.jpeg_huff_tab = huff_tab; |
| } |
| |
| memset(huff_tab, 0, sizeof(*huff_tab)); |
| memcpy(huff_tab->luma_dc, huffman_tables[0].start, huffman_tables[0].length); |
| memcpy(huff_tab->chroma_dc, huffman_tables[1].start, huffman_tables[1].length); |
| memcpy(huff_tab->luma_ac, huffman_tables[2].start, huffman_tables[2].length); |
| memcpy(huff_tab->chroma_ac, huffman_tables[3].start, huffman_tables[3].length); |
| |
| /* check scan header */ |
| for (i = 0; i < scan_header.num_components; i++) { |
| struct v4l2_jpeg_scan_component_spec *scan_component; |
| |
| scan_component = &scan_header.component[i]; |
| for (j = 0; j < header.frame.num_components; j++) { |
| if (header.frame.component[j].component_identifier == |
| scan_component->component_selector) |
| break; |
| } |
| if (j == header.frame.num_components) |
| continue; |
| |
| ctx->params.jpeg_huff_dc_index[j] = |
| scan_component->dc_entropy_coding_table_selector; |
| ctx->params.jpeg_huff_ac_index[j] = |
| scan_component->ac_entropy_coding_table_selector; |
| } |
| |
| /* Generate Huffman table information */ |
| for (i = 0; i < 4; i++) |
| coda9_jpeg_gen_dec_huff_tab(ctx, i); |
| |
| /* start of entropy coded segment */ |
| ctx->jpeg_ecs_offset = header.ecs_offset; |
| |
| switch (header.frame.subsampling) { |
| case V4L2_JPEG_CHROMA_SUBSAMPLING_420: |
| case V4L2_JPEG_CHROMA_SUBSAMPLING_422: |
| ctx->params.jpeg_chroma_subsampling = header.frame.subsampling; |
| break; |
| default: |
| v4l2_err(&dev->v4l2_dev, "chroma subsampling not supported: %d", |
| header.frame.subsampling); |
| return -EINVAL; |
| } |
| |
| return 0; |
| } |
| |
| static inline void coda9_jpeg_write_huff_values(struct coda_dev *dev, u8 *bits, |
| int num_values) |
| { |
| s8 *values = (s8 *)(bits + 16); |
| int huff_length, i; |
| |
| for (huff_length = 0, i = 0; i < 16; i++) |
| huff_length += bits[i]; |
| for (i = huff_length; i < num_values; i++) |
| values[i] = -1; |
| for (i = 0; i < num_values; i++) |
| coda_write(dev, (s32)values[i], CODA9_REG_JPEG_HUFF_DATA); |
| } |
| |
| static int coda9_jpeg_dec_huff_setup(struct coda_ctx *ctx) |
| { |
| struct coda_huff_tab *huff_tab = ctx->params.jpeg_huff_tab; |
| struct coda_dev *dev = ctx->dev; |
| s16 *huff_min = huff_tab->min; |
| s16 *huff_max = huff_tab->max; |
| s8 *huff_ptr = huff_tab->ptr; |
| int i; |
| |
| /* MIN Tables */ |
| coda_write(dev, 0x003, CODA9_REG_JPEG_HUFF_CTRL); |
| coda_write(dev, 0x000, CODA9_REG_JPEG_HUFF_ADDR); |
| for (i = 0; i < 4 * 16; i++) |
| coda_write(dev, (s32)huff_min[i], CODA9_REG_JPEG_HUFF_DATA); |
| |
| /* MAX Tables */ |
| coda_write(dev, 0x403, CODA9_REG_JPEG_HUFF_CTRL); |
| coda_write(dev, 0x440, CODA9_REG_JPEG_HUFF_ADDR); |
| for (i = 0; i < 4 * 16; i++) |
| coda_write(dev, (s32)huff_max[i], CODA9_REG_JPEG_HUFF_DATA); |
| |
| /* PTR Tables */ |
| coda_write(dev, 0x803, CODA9_REG_JPEG_HUFF_CTRL); |
| coda_write(dev, 0x880, CODA9_REG_JPEG_HUFF_ADDR); |
| for (i = 0; i < 4 * 16; i++) |
| coda_write(dev, (s32)huff_ptr[i], CODA9_REG_JPEG_HUFF_DATA); |
| |
| /* VAL Tables: DC Luma, DC Chroma, AC Luma, AC Chroma */ |
| coda_write(dev, 0xc03, CODA9_REG_JPEG_HUFF_CTRL); |
| coda9_jpeg_write_huff_values(dev, huff_tab->luma_dc, 12); |
| coda9_jpeg_write_huff_values(dev, huff_tab->chroma_dc, 12); |
| coda9_jpeg_write_huff_values(dev, huff_tab->luma_ac, 162); |
| coda9_jpeg_write_huff_values(dev, huff_tab->chroma_ac, 162); |
| coda_write(dev, 0x000, CODA9_REG_JPEG_HUFF_CTRL); |
| return 0; |
| } |
| |
| static inline void coda9_jpeg_write_qmat_tab(struct coda_dev *dev, |
| u8 *qmat, int index) |
| { |
| int i; |
| |
| coda_write(dev, index | 0x3, CODA9_REG_JPEG_QMAT_CTRL); |
| for (i = 0; i < 64; i++) |
| coda_write(dev, qmat[i], CODA9_REG_JPEG_QMAT_DATA); |
| coda_write(dev, 0, CODA9_REG_JPEG_QMAT_CTRL); |
| } |
| |
| static void coda9_jpeg_qmat_setup(struct coda_ctx *ctx) |
| { |
| struct coda_dev *dev = ctx->dev; |
| int *qmat_index = ctx->params.jpeg_qmat_index; |
| u8 **qmat_tab = ctx->params.jpeg_qmat_tab; |
| |
| coda9_jpeg_write_qmat_tab(dev, qmat_tab[qmat_index[0]], 0x00); |
| coda9_jpeg_write_qmat_tab(dev, qmat_tab[qmat_index[1]], 0x40); |
| coda9_jpeg_write_qmat_tab(dev, qmat_tab[qmat_index[2]], 0x80); |
| } |
| |
| static void coda9_jpeg_dec_bbc_gbu_setup(struct coda_ctx *ctx, |
| struct vb2_buffer *buf, u32 ecs_offset) |
| { |
| struct coda_dev *dev = ctx->dev; |
| int page_ptr, word_ptr, bit_ptr; |
| u32 bbc_base_addr, end_addr; |
| int bbc_cur_pos; |
| int ret, val; |
| |
| bbc_base_addr = vb2_dma_contig_plane_dma_addr(buf, 0); |
| end_addr = bbc_base_addr + vb2_get_plane_payload(buf, 0); |
| |
| page_ptr = ecs_offset / 256; |
| word_ptr = (ecs_offset % 256) / 4; |
| if (page_ptr & 1) |
| word_ptr += 64; |
| bit_ptr = (ecs_offset % 4) * 8; |
| if (word_ptr & 1) |
| bit_ptr += 32; |
| word_ptr &= ~0x1; |
| |
| coda_write(dev, end_addr, CODA9_REG_JPEG_BBC_WR_PTR); |
| coda_write(dev, bbc_base_addr, CODA9_REG_JPEG_BBC_BAS_ADDR); |
| |
| /* Leave 3 256-byte page margin to avoid a BBC interrupt */ |
| coda_write(dev, end_addr + 256 * 3 + 256, CODA9_REG_JPEG_BBC_END_ADDR); |
| val = DIV_ROUND_UP(vb2_plane_size(buf, 0), 256) + 3; |
| coda_write(dev, BIT(31) | val, CODA9_REG_JPEG_BBC_STRM_CTRL); |
| |
| bbc_cur_pos = page_ptr; |
| coda_write(dev, bbc_cur_pos, CODA9_REG_JPEG_BBC_CUR_POS); |
| coda_write(dev, bbc_base_addr + (bbc_cur_pos << 8), |
| CODA9_REG_JPEG_BBC_EXT_ADDR); |
| coda_write(dev, (bbc_cur_pos & 1) << 6, CODA9_REG_JPEG_BBC_INT_ADDR); |
| coda_write(dev, 64, CODA9_REG_JPEG_BBC_DATA_CNT); |
| coda_write(dev, 0, CODA9_REG_JPEG_BBC_COMMAND); |
| do { |
| ret = coda_read(dev, CODA9_REG_JPEG_BBC_BUSY); |
| } while (ret == 1); |
| |
| bbc_cur_pos++; |
| coda_write(dev, bbc_cur_pos, CODA9_REG_JPEG_BBC_CUR_POS); |
| coda_write(dev, bbc_base_addr + (bbc_cur_pos << 8), |
| CODA9_REG_JPEG_BBC_EXT_ADDR); |
| coda_write(dev, (bbc_cur_pos & 1) << 6, CODA9_REG_JPEG_BBC_INT_ADDR); |
| coda_write(dev, 64, CODA9_REG_JPEG_BBC_DATA_CNT); |
| coda_write(dev, 0, CODA9_REG_JPEG_BBC_COMMAND); |
| do { |
| ret = coda_read(dev, CODA9_REG_JPEG_BBC_BUSY); |
| } while (ret == 1); |
| |
| bbc_cur_pos++; |
| coda_write(dev, bbc_cur_pos, CODA9_REG_JPEG_BBC_CUR_POS); |
| coda_write(dev, 1, CODA9_REG_JPEG_BBC_CTRL); |
| |
| coda_write(dev, 0, CODA9_REG_JPEG_GBU_TT_CNT); |
| coda_write(dev, word_ptr, CODA9_REG_JPEG_GBU_WD_PTR); |
| coda_write(dev, 0, CODA9_REG_JPEG_GBU_BBSR); |
| coda_write(dev, 127, CODA9_REG_JPEG_GBU_BBER); |
| if (page_ptr & 1) { |
| coda_write(dev, 0, CODA9_REG_JPEG_GBU_BBIR); |
| coda_write(dev, 0, CODA9_REG_JPEG_GBU_BBHR); |
| } else { |
| coda_write(dev, 64, CODA9_REG_JPEG_GBU_BBIR); |
| coda_write(dev, 64, CODA9_REG_JPEG_GBU_BBHR); |
| } |
| coda_write(dev, 4, CODA9_REG_JPEG_GBU_CTRL); |
| coda_write(dev, bit_ptr, CODA9_REG_JPEG_GBU_FF_RPTR); |
| coda_write(dev, 3, CODA9_REG_JPEG_GBU_CTRL); |
| } |
| |
| static const int bus_req_num[] = { |
| [CODA9_JPEG_FORMAT_420] = 2, |
| [CODA9_JPEG_FORMAT_422] = 3, |
| [CODA9_JPEG_FORMAT_224] = 3, |
| [CODA9_JPEG_FORMAT_444] = 4, |
| [CODA9_JPEG_FORMAT_400] = 4, |
| }; |
| |
| #define MCU_INFO(mcu_block_num, comp_num, comp0_info, comp1_info, comp2_info) \ |
| (((mcu_block_num) << CODA9_JPEG_MCU_BLOCK_NUM_OFFSET) | \ |
| ((comp_num) << CODA9_JPEG_COMP_NUM_OFFSET) | \ |
| ((comp0_info) << CODA9_JPEG_COMP0_INFO_OFFSET) | \ |
| ((comp1_info) << CODA9_JPEG_COMP1_INFO_OFFSET) | \ |
| ((comp2_info) << CODA9_JPEG_COMP2_INFO_OFFSET)) |
| |
| static const u32 mcu_info[] = { |
| [CODA9_JPEG_FORMAT_420] = MCU_INFO(6, 3, 10, 5, 5), |
| [CODA9_JPEG_FORMAT_422] = MCU_INFO(4, 3, 9, 5, 5), |
| [CODA9_JPEG_FORMAT_224] = MCU_INFO(4, 3, 6, 5, 5), |
| [CODA9_JPEG_FORMAT_444] = MCU_INFO(3, 3, 5, 5, 5), |
| [CODA9_JPEG_FORMAT_400] = MCU_INFO(1, 1, 5, 0, 0), |
| }; |
| |
| /* |
| * Convert Huffman table specifcations to tables of codes and code lengths. |
| * For reference, see JPEG ITU-T.81 (ISO/IEC 10918-1) [1] |
| * |
| * [1] https://www.w3.org/Graphics/JPEG/itu-t81.pdf |
| */ |
| static int coda9_jpeg_gen_enc_huff_tab(struct coda_ctx *ctx, int tab_num, |
| int *ehufsi, int *ehufco) |
| { |
| int i, j, k, lastk, si, code, maxsymbol; |
| const u8 *bits, *huffval; |
| struct { |
| int size[256]; |
| int code[256]; |
| } *huff; |
| static const unsigned char *huff_tabs[4] = { |
| luma_dc, luma_ac, chroma_dc, chroma_ac, |
| }; |
| int ret = -EINVAL; |
| |
| huff = kzalloc(sizeof(*huff), GFP_KERNEL); |
| if (!huff) |
| return -ENOMEM; |
| |
| bits = huff_tabs[tab_num]; |
| huffval = huff_tabs[tab_num] + 16; |
| |
| maxsymbol = tab_num & 1 ? 256 : 16; |
| |
| /* Figure C.1 - Generation of table of Huffman code sizes */ |
| k = 0; |
| for (i = 1; i <= 16; i++) { |
| j = bits[i - 1]; |
| if (k + j > maxsymbol) |
| goto out; |
| while (j--) |
| huff->size[k++] = i; |
| } |
| lastk = k; |
| |
| /* Figure C.2 - Generation of table of Huffman codes */ |
| k = 0; |
| code = 0; |
| si = huff->size[0]; |
| while (k < lastk) { |
| while (huff->size[k] == si) { |
| huff->code[k++] = code; |
| code++; |
| } |
| if (code >= (1 << si)) |
| goto out; |
| code <<= 1; |
| si++; |
| } |
| |
| /* Figure C.3 - Ordering procedure for encoding procedure code tables */ |
| for (k = 0; k < lastk; k++) { |
| i = huffval[k]; |
| if (i >= maxsymbol || ehufsi[i]) |
| goto out; |
| ehufco[i] = huff->code[k]; |
| ehufsi[i] = huff->size[k]; |
| } |
| |
| ret = 0; |
| out: |
| kfree(huff); |
| return ret; |
| } |
| |
| #define DC_TABLE_INDEX0 0 |
| #define AC_TABLE_INDEX0 1 |
| #define DC_TABLE_INDEX1 2 |
| #define AC_TABLE_INDEX1 3 |
| |
| static u8 *coda9_jpeg_get_huff_bits(struct coda_ctx *ctx, int tab_num) |
| { |
| struct coda_huff_tab *huff_tab = ctx->params.jpeg_huff_tab; |
| |
| if (!huff_tab) |
| return NULL; |
| |
| switch (tab_num) { |
| case DC_TABLE_INDEX0: return huff_tab->luma_dc; |
| case AC_TABLE_INDEX0: return huff_tab->luma_ac; |
| case DC_TABLE_INDEX1: return huff_tab->chroma_dc; |
| case AC_TABLE_INDEX1: return huff_tab->chroma_ac; |
| } |
| |
| return NULL; |
| } |
| |
| static int coda9_jpeg_gen_dec_huff_tab(struct coda_ctx *ctx, int tab_num) |
| { |
| int ptr_cnt = 0, huff_code = 0, zero_flag = 0, data_flag = 0; |
| u8 *huff_bits; |
| s16 *huff_max; |
| s16 *huff_min; |
| s8 *huff_ptr; |
| int ofs; |
| int i; |
| |
| huff_bits = coda9_jpeg_get_huff_bits(ctx, tab_num); |
| if (!huff_bits) |
| return -EINVAL; |
| |
| /* DC/AC Luma, DC/AC Chroma -> DC Luma/Chroma, AC Luma/Chroma */ |
| ofs = ((tab_num & 1) << 1) | ((tab_num >> 1) & 1); |
| ofs *= 16; |
| |
| huff_ptr = ctx->params.jpeg_huff_tab->ptr + ofs; |
| huff_max = ctx->params.jpeg_huff_tab->max + ofs; |
| huff_min = ctx->params.jpeg_huff_tab->min + ofs; |
| |
| for (i = 0; i < 16; i++) { |
| if (huff_bits[i]) { |
| huff_ptr[i] = ptr_cnt; |
| ptr_cnt += huff_bits[i]; |
| huff_min[i] = huff_code; |
| huff_max[i] = huff_code + (huff_bits[i] - 1); |
| data_flag = 1; |
| zero_flag = 0; |
| } else { |
| huff_ptr[i] = -1; |
| huff_min[i] = -1; |
| huff_max[i] = -1; |
| zero_flag = 1; |
| } |
| |
| if (data_flag == 1) { |
| if (zero_flag == 1) |
| huff_code <<= 1; |
| else |
| huff_code = (huff_max[i] + 1) << 1; |
| } |
| } |
| |
| return 0; |
| } |
| |
| static int coda9_jpeg_load_huff_tab(struct coda_ctx *ctx) |
| { |
| struct { |
| int size[4][256]; |
| int code[4][256]; |
| } *huff; |
| u32 *huff_data; |
| int i, j; |
| int ret; |
| |
| huff = kzalloc(sizeof(*huff), GFP_KERNEL); |
| if (!huff) |
| return -ENOMEM; |
| |
| /* Generate all four (luma/chroma DC/AC) code/size lookup tables */ |
| for (i = 0; i < 4; i++) { |
| ret = coda9_jpeg_gen_enc_huff_tab(ctx, i, huff->size[i], |
| huff->code[i]); |
| if (ret) |
| goto out; |
| } |
| |
| if (!ctx->params.jpeg_huff_data) { |
| ctx->params.jpeg_huff_data = |
| kzalloc(sizeof(u32) * CODA9_JPEG_ENC_HUFF_DATA_SIZE, |
| GFP_KERNEL); |
| if (!ctx->params.jpeg_huff_data) { |
| ret = -ENOMEM; |
| goto out; |
| } |
| } |
| huff_data = ctx->params.jpeg_huff_data; |
| |
| for (j = 0; j < 4; j++) { |
| /* Store Huffman lookup tables in AC0, AC1, DC0, DC1 order */ |
| int t = (j == 0) ? AC_TABLE_INDEX0 : |
| (j == 1) ? AC_TABLE_INDEX1 : |
| (j == 2) ? DC_TABLE_INDEX0 : |
| DC_TABLE_INDEX1; |
| /* DC tables only have 16 entries */ |
| int len = (j < 2) ? 256 : 16; |
| |
| for (i = 0; i < len; i++) { |
| if (huff->size[t][i] == 0 && huff->code[t][i] == 0) |
| *(huff_data++) = 0; |
| else |
| *(huff_data++) = |
| ((huff->size[t][i] - 1) << 16) | |
| huff->code[t][i]; |
| } |
| } |
| |
| ret = 0; |
| out: |
| kfree(huff); |
| return ret; |
| } |
| |
| static void coda9_jpeg_write_huff_tab(struct coda_ctx *ctx) |
| { |
| struct coda_dev *dev = ctx->dev; |
| u32 *huff_data = ctx->params.jpeg_huff_data; |
| int i; |
| |
| /* Write Huffman size/code lookup tables in AC0, AC1, DC0, DC1 order */ |
| coda_write(dev, 0x3, CODA9_REG_JPEG_HUFF_CTRL); |
| for (i = 0; i < CODA9_JPEG_ENC_HUFF_DATA_SIZE; i++) |
| coda_write(dev, *(huff_data++), CODA9_REG_JPEG_HUFF_DATA); |
| coda_write(dev, 0x0, CODA9_REG_JPEG_HUFF_CTRL); |
| } |
| |
| static inline void coda9_jpeg_write_qmat_quotients(struct coda_dev *dev, |
| u8 *qmat, int index) |
| { |
| int i; |
| |
| coda_write(dev, index | 0x3, CODA9_REG_JPEG_QMAT_CTRL); |
| for (i = 0; i < 64; i++) |
| coda_write(dev, 0x80000 / qmat[i], CODA9_REG_JPEG_QMAT_DATA); |
| coda_write(dev, index, CODA9_REG_JPEG_QMAT_CTRL); |
| } |
| |
| static void coda9_jpeg_load_qmat_tab(struct coda_ctx *ctx) |
| { |
| struct coda_dev *dev = ctx->dev; |
| u8 *luma_tab; |
| u8 *chroma_tab; |
| |
| luma_tab = ctx->params.jpeg_qmat_tab[0]; |
| if (!luma_tab) |
| luma_tab = luma_q; |
| |
| chroma_tab = ctx->params.jpeg_qmat_tab[1]; |
| if (!chroma_tab) |
| chroma_tab = chroma_q; |
| |
| coda9_jpeg_write_qmat_quotients(dev, luma_tab, 0x00); |
| coda9_jpeg_write_qmat_quotients(dev, chroma_tab, 0x40); |
| coda9_jpeg_write_qmat_quotients(dev, chroma_tab, 0x80); |
| } |
| |
| struct coda_jpeg_stream { |
| u8 *curr; |
| u8 *end; |
| }; |
| |
| static inline int coda_jpeg_put_byte(u8 byte, struct coda_jpeg_stream *stream) |
| { |
| if (stream->curr >= stream->end) |
| return -EINVAL; |
| |
| *stream->curr++ = byte; |
| |
| return 0; |
| } |
| |
| static inline int coda_jpeg_put_word(u16 word, struct coda_jpeg_stream *stream) |
| { |
| if (stream->curr + sizeof(__be16) > stream->end) |
| return -EINVAL; |
| |
| put_unaligned_be16(word, stream->curr); |
| stream->curr += sizeof(__be16); |
| |
| return 0; |
| } |
| |
| static int coda_jpeg_put_table(u16 marker, u8 index, const u8 *table, |
| size_t len, struct coda_jpeg_stream *stream) |
| { |
| int i, ret; |
| |
| ret = coda_jpeg_put_word(marker, stream); |
| if (ret < 0) |
| return ret; |
| ret = coda_jpeg_put_word(3 + len, stream); |
| if (ret < 0) |
| return ret; |
| ret = coda_jpeg_put_byte(index, stream); |
| for (i = 0; i < len && ret == 0; i++) |
| ret = coda_jpeg_put_byte(table[i], stream); |
| |
| return ret; |
| } |
| |
| static int coda_jpeg_define_quantization_table(struct coda_ctx *ctx, u8 index, |
| struct coda_jpeg_stream *stream) |
| { |
| return coda_jpeg_put_table(DQT_MARKER, index, |
| ctx->params.jpeg_qmat_tab[index], 64, |
| stream); |
| } |
| |
| static int coda_jpeg_define_huffman_table(u8 index, const u8 *table, size_t len, |
| struct coda_jpeg_stream *stream) |
| { |
| return coda_jpeg_put_table(DHT_MARKER, index, table, len, stream); |
| } |
| |
| static int coda9_jpeg_encode_header(struct coda_ctx *ctx, int len, u8 *buf) |
| { |
| struct coda_jpeg_stream stream = { buf, buf + len }; |
| struct coda_q_data *q_data_src; |
| int chroma_format, comp_num; |
| int i, ret, pad; |
| |
| q_data_src = get_q_data(ctx, V4L2_BUF_TYPE_VIDEO_OUTPUT); |
| chroma_format = coda9_jpeg_chroma_format(q_data_src->fourcc); |
| if (chroma_format < 0) |
| return 0; |
| |
| /* Start Of Image */ |
| ret = coda_jpeg_put_word(SOI_MARKER, &stream); |
| if (ret < 0) |
| return ret; |
| |
| /* Define Restart Interval */ |
| if (ctx->params.jpeg_restart_interval) { |
| ret = coda_jpeg_put_word(DRI_MARKER, &stream); |
| if (ret < 0) |
| return ret; |
| ret = coda_jpeg_put_word(4, &stream); |
| if (ret < 0) |
| return ret; |
| ret = coda_jpeg_put_word(ctx->params.jpeg_restart_interval, |
| &stream); |
| if (ret < 0) |
| return ret; |
| } |
| |
| /* Define Quantization Tables */ |
| ret = coda_jpeg_define_quantization_table(ctx, 0x00, &stream); |
| if (ret < 0) |
| return ret; |
| if (chroma_format != CODA9_JPEG_FORMAT_400) { |
| ret = coda_jpeg_define_quantization_table(ctx, 0x01, &stream); |
| if (ret < 0) |
| return ret; |
| } |
| |
| /* Define Huffman Tables */ |
| ret = coda_jpeg_define_huffman_table(0x00, luma_dc, 16 + 12, &stream); |
| if (ret < 0) |
| return ret; |
| ret = coda_jpeg_define_huffman_table(0x10, luma_ac, 16 + 162, &stream); |
| if (ret < 0) |
| return ret; |
| if (chroma_format != CODA9_JPEG_FORMAT_400) { |
| ret = coda_jpeg_define_huffman_table(0x01, chroma_dc, 16 + 12, |
| &stream); |
| if (ret < 0) |
| return ret; |
| ret = coda_jpeg_define_huffman_table(0x11, chroma_ac, 16 + 162, |
| &stream); |
| if (ret < 0) |
| return ret; |
| } |
| |
| /* Start Of Frame */ |
| ret = coda_jpeg_put_word(SOF_MARKER, &stream); |
| if (ret < 0) |
| return ret; |
| comp_num = (chroma_format == CODA9_JPEG_FORMAT_400) ? 1 : 3; |
| ret = coda_jpeg_put_word(8 + comp_num * 3, &stream); |
| if (ret < 0) |
| return ret; |
| ret = coda_jpeg_put_byte(0x08, &stream); |
| if (ret < 0) |
| return ret; |
| ret = coda_jpeg_put_word(q_data_src->height, &stream); |
| if (ret < 0) |
| return ret; |
| ret = coda_jpeg_put_word(q_data_src->width, &stream); |
| if (ret < 0) |
| return ret; |
| ret = coda_jpeg_put_byte(comp_num, &stream); |
| if (ret < 0) |
| return ret; |
| for (i = 0; i < comp_num; i++) { |
| static unsigned char subsampling[5][3] = { |
| [CODA9_JPEG_FORMAT_420] = { 0x22, 0x11, 0x11 }, |
| [CODA9_JPEG_FORMAT_422] = { 0x21, 0x11, 0x11 }, |
| [CODA9_JPEG_FORMAT_224] = { 0x12, 0x11, 0x11 }, |
| [CODA9_JPEG_FORMAT_444] = { 0x11, 0x11, 0x11 }, |
| [CODA9_JPEG_FORMAT_400] = { 0x11 }, |
| }; |
| |
| /* Component identifier, matches SOS */ |
| ret = coda_jpeg_put_byte(i + 1, &stream); |
| if (ret < 0) |
| return ret; |
| ret = coda_jpeg_put_byte(subsampling[chroma_format][i], |
| &stream); |
| if (ret < 0) |
| return ret; |
| /* Chroma table index */ |
| ret = coda_jpeg_put_byte((i == 0) ? 0 : 1, &stream); |
| if (ret < 0) |
| return ret; |
| } |
| |
| /* Pad to multiple of 8 bytes */ |
| pad = (stream.curr - buf) % 8; |
| if (pad) { |
| pad = 8 - pad; |
| while (pad--) { |
| ret = coda_jpeg_put_byte(0x00, &stream); |
| if (ret < 0) |
| return ret; |
| } |
| } |
| |
| return stream.curr - buf; |
| } |
| |
| /* |
| * Scale quantization table using nonlinear scaling factor |
| * u8 qtab[64], scale [50,190] |
| */ |
| static void coda_scale_quant_table(u8 *q_tab, int scale) |
| { |
| unsigned int temp; |
| int i; |
| |
| for (i = 0; i < 64; i++) { |
| temp = DIV_ROUND_CLOSEST((unsigned int)q_tab[i] * scale, 100); |
| if (temp <= 0) |
| temp = 1; |
| if (temp > 255) |
| temp = 255; |
| q_tab[i] = (unsigned char)temp; |
| } |
| } |
| |
| void coda_set_jpeg_compression_quality(struct coda_ctx *ctx, int quality) |
| { |
| unsigned int scale; |
| |
| ctx->params.jpeg_quality = quality; |
| |
| /* Clip quality setting to [5,100] interval */ |
| if (quality > 100) |
| quality = 100; |
| if (quality < 5) |
| quality = 5; |
| |
| /* |
| * Non-linear scaling factor: |
| * [5,50] -> [1000..100], [51,100] -> [98..0] |
| */ |
| if (quality < 50) |
| scale = 5000 / quality; |
| else |
| scale = 200 - 2 * quality; |
| |
| if (ctx->params.jpeg_qmat_tab[0]) { |
| memcpy(ctx->params.jpeg_qmat_tab[0], luma_q, 64); |
| coda_scale_quant_table(ctx->params.jpeg_qmat_tab[0], scale); |
| } |
| if (ctx->params.jpeg_qmat_tab[1]) { |
| memcpy(ctx->params.jpeg_qmat_tab[1], chroma_q, 64); |
| coda_scale_quant_table(ctx->params.jpeg_qmat_tab[1], scale); |
| } |
| } |
| |
| /* |
| * Encoder context operations |
| */ |
| |
| static int coda9_jpeg_start_encoding(struct coda_ctx *ctx) |
| { |
| struct coda_dev *dev = ctx->dev; |
| int ret; |
| |
| ret = coda9_jpeg_load_huff_tab(ctx); |
| if (ret < 0) { |
| v4l2_err(&dev->v4l2_dev, "error loading Huffman tables\n"); |
| return ret; |
| } |
| if (!ctx->params.jpeg_qmat_tab[0]) |
| ctx->params.jpeg_qmat_tab[0] = kmalloc(64, GFP_KERNEL); |
| if (!ctx->params.jpeg_qmat_tab[1]) |
| ctx->params.jpeg_qmat_tab[1] = kmalloc(64, GFP_KERNEL); |
| coda_set_jpeg_compression_quality(ctx, ctx->params.jpeg_quality); |
| |
| return 0; |
| } |
| |
| static int coda9_jpeg_prepare_encode(struct coda_ctx *ctx) |
| { |
| struct coda_q_data *q_data_src; |
| struct vb2_v4l2_buffer *src_buf, *dst_buf; |
| struct coda_dev *dev = ctx->dev; |
| u32 start_addr, end_addr; |
| u16 aligned_width, aligned_height; |
| bool chroma_interleave; |
| int chroma_format; |
| int header_len; |
| int ret; |
| ktime_t timeout; |
| |
| src_buf = v4l2_m2m_next_src_buf(ctx->fh.m2m_ctx); |
| dst_buf = v4l2_m2m_next_dst_buf(ctx->fh.m2m_ctx); |
| q_data_src = get_q_data(ctx, V4L2_BUF_TYPE_VIDEO_OUTPUT); |
| |
| if (vb2_get_plane_payload(&src_buf->vb2_buf, 0) == 0) |
| vb2_set_plane_payload(&src_buf->vb2_buf, 0, |
| vb2_plane_size(&src_buf->vb2_buf, 0)); |
| |
| src_buf->sequence = ctx->osequence; |
| dst_buf->sequence = ctx->osequence; |
| ctx->osequence++; |
| |
| src_buf->flags |= V4L2_BUF_FLAG_KEYFRAME; |
| src_buf->flags &= ~V4L2_BUF_FLAG_PFRAME; |
| |
| coda_set_gdi_regs(ctx); |
| |
| start_addr = vb2_dma_contig_plane_dma_addr(&dst_buf->vb2_buf, 0); |
| end_addr = start_addr + vb2_plane_size(&dst_buf->vb2_buf, 0); |
| |
| chroma_format = coda9_jpeg_chroma_format(q_data_src->fourcc); |
| if (chroma_format < 0) |
| return chroma_format; |
| |
| /* Round image dimensions to multiple of MCU size */ |
| aligned_width = round_up(q_data_src->width, width_align[chroma_format]); |
| aligned_height = round_up(q_data_src->height, |
| height_align[chroma_format]); |
| if (aligned_width != q_data_src->bytesperline) { |
| v4l2_err(&dev->v4l2_dev, "wrong stride: %d instead of %d\n", |
| aligned_width, q_data_src->bytesperline); |
| } |
| |
| header_len = |
| coda9_jpeg_encode_header(ctx, |
| vb2_plane_size(&dst_buf->vb2_buf, 0), |
| vb2_plane_vaddr(&dst_buf->vb2_buf, 0)); |
| if (header_len < 0) |
| return header_len; |
| |
| coda_write(dev, start_addr + header_len, CODA9_REG_JPEG_BBC_BAS_ADDR); |
| coda_write(dev, end_addr, CODA9_REG_JPEG_BBC_END_ADDR); |
| coda_write(dev, start_addr + header_len, CODA9_REG_JPEG_BBC_WR_PTR); |
| coda_write(dev, start_addr + header_len, CODA9_REG_JPEG_BBC_RD_PTR); |
| coda_write(dev, 0, CODA9_REG_JPEG_BBC_CUR_POS); |
| /* 64 words per 256-byte page */ |
| coda_write(dev, 64, CODA9_REG_JPEG_BBC_DATA_CNT); |
| coda_write(dev, start_addr, CODA9_REG_JPEG_BBC_EXT_ADDR); |
| coda_write(dev, 0, CODA9_REG_JPEG_BBC_INT_ADDR); |
| |
| coda_write(dev, 0, CODA9_REG_JPEG_GBU_BT_PTR); |
| coda_write(dev, 0, CODA9_REG_JPEG_GBU_WD_PTR); |
| coda_write(dev, 0, CODA9_REG_JPEG_GBU_BBSR); |
| coda_write(dev, BIT(31) | ((end_addr - start_addr - header_len) / 256), |
| CODA9_REG_JPEG_BBC_STRM_CTRL); |
| coda_write(dev, 0, CODA9_REG_JPEG_GBU_CTRL); |
| coda_write(dev, 0, CODA9_REG_JPEG_GBU_FF_RPTR); |
| coda_write(dev, 127, CODA9_REG_JPEG_GBU_BBER); |
| coda_write(dev, 64, CODA9_REG_JPEG_GBU_BBIR); |
| coda_write(dev, 64, CODA9_REG_JPEG_GBU_BBHR); |
| |
| chroma_interleave = (q_data_src->fourcc == V4L2_PIX_FMT_NV12); |
| coda_write(dev, CODA9_JPEG_PIC_CTRL_TC_DIRECTION | |
| CODA9_JPEG_PIC_CTRL_ENCODER_EN, CODA9_REG_JPEG_PIC_CTRL); |
| coda_write(dev, 0, CODA9_REG_JPEG_SCL_INFO); |
| coda_write(dev, chroma_interleave, CODA9_REG_JPEG_DPB_CONFIG); |
| coda_write(dev, ctx->params.jpeg_restart_interval, |
| CODA9_REG_JPEG_RST_INTVAL); |
| coda_write(dev, 1, CODA9_REG_JPEG_BBC_CTRL); |
| |
| coda_write(dev, bus_req_num[chroma_format], CODA9_REG_JPEG_OP_INFO); |
| |
| coda9_jpeg_write_huff_tab(ctx); |
| coda9_jpeg_load_qmat_tab(ctx); |
| |
| if (ctx->params.rot_mode & CODA_ROT_90) { |
| aligned_width = aligned_height; |
| aligned_height = q_data_src->bytesperline; |
| if (chroma_format == CODA9_JPEG_FORMAT_422) |
| chroma_format = CODA9_JPEG_FORMAT_224; |
| else if (chroma_format == CODA9_JPEG_FORMAT_224) |
| chroma_format = CODA9_JPEG_FORMAT_422; |
| } |
| /* These need to be multiples of MCU size */ |
| coda_write(dev, aligned_width << 16 | aligned_height, |
| CODA9_REG_JPEG_PIC_SIZE); |
| coda_write(dev, ctx->params.rot_mode ? |
| (CODA_ROT_MIR_ENABLE | ctx->params.rot_mode) : 0, |
| CODA9_REG_JPEG_ROT_INFO); |
| |
| coda_write(dev, mcu_info[chroma_format], CODA9_REG_JPEG_MCU_INFO); |
| |
| coda_write(dev, 1, CODA9_GDI_CONTROL); |
| timeout = ktime_add_us(ktime_get(), 100000); |
| do { |
| ret = coda_read(dev, CODA9_GDI_STATUS); |
| if (ktime_compare(ktime_get(), timeout) > 0) { |
| v4l2_err(&dev->v4l2_dev, "timeout waiting for GDI\n"); |
| return -ETIMEDOUT; |
| } |
| } while (!ret); |
| |
| coda_write(dev, (chroma_format << 17) | (chroma_interleave << 16) | |
| q_data_src->bytesperline, CODA9_GDI_INFO_CONTROL); |
| /* The content of this register seems to be irrelevant: */ |
| coda_write(dev, aligned_width << 16 | aligned_height, |
| CODA9_GDI_INFO_PIC_SIZE); |
| |
| coda_write_base(ctx, q_data_src, src_buf, CODA9_GDI_INFO_BASE_Y); |
| |
| coda_write(dev, 0, CODA9_REG_JPEG_DPB_BASE00); |
| coda_write(dev, 0, CODA9_GDI_CONTROL); |
| coda_write(dev, 1, CODA9_GDI_PIC_INIT_HOST); |
| |
| coda_write(dev, 1, CODA9_GDI_WPROT_ERR_CLR); |
| coda_write(dev, 0, CODA9_GDI_WPROT_RGN_EN); |
| |
| trace_coda_jpeg_run(ctx, src_buf); |
| |
| coda_write(dev, 1, CODA9_REG_JPEG_PIC_START); |
| |
| return 0; |
| } |
| |
| static void coda9_jpeg_finish_encode(struct coda_ctx *ctx) |
| { |
| struct vb2_v4l2_buffer *src_buf, *dst_buf; |
| struct coda_dev *dev = ctx->dev; |
| u32 wr_ptr, start_ptr; |
| u32 err_mb; |
| |
| if (ctx->aborting) { |
| coda_write(ctx->dev, 0, CODA9_REG_JPEG_BBC_FLUSH_CMD); |
| return; |
| } |
| |
| /* |
| * Lock to make sure that an encoder stop command running in parallel |
| * will either already have marked src_buf as last, or it will wake up |
| * the capture queue after the buffers are returned. |
| */ |
| mutex_lock(&ctx->wakeup_mutex); |
| src_buf = v4l2_m2m_src_buf_remove(ctx->fh.m2m_ctx); |
| dst_buf = v4l2_m2m_dst_buf_remove(ctx->fh.m2m_ctx); |
| |
| trace_coda_jpeg_done(ctx, dst_buf); |
| |
| /* |
| * Set plane payload to the number of bytes written out |
| * by the JPEG processing unit |
| */ |
| start_ptr = vb2_dma_contig_plane_dma_addr(&dst_buf->vb2_buf, 0); |
| wr_ptr = coda_read(dev, CODA9_REG_JPEG_BBC_WR_PTR); |
| vb2_set_plane_payload(&dst_buf->vb2_buf, 0, wr_ptr - start_ptr); |
| |
| err_mb = coda_read(dev, CODA9_REG_JPEG_PIC_ERRMB); |
| if (err_mb) |
| coda_dbg(1, ctx, "ERRMB: 0x%x\n", err_mb); |
| |
| coda_write(dev, 0, CODA9_REG_JPEG_BBC_FLUSH_CMD); |
| |
| dst_buf->flags &= ~(V4L2_BUF_FLAG_PFRAME | V4L2_BUF_FLAG_LAST); |
| dst_buf->flags |= V4L2_BUF_FLAG_KEYFRAME; |
| dst_buf->flags |= src_buf->flags & V4L2_BUF_FLAG_LAST; |
| |
| v4l2_m2m_buf_copy_metadata(src_buf, dst_buf, false); |
| |
| v4l2_m2m_buf_done(src_buf, VB2_BUF_STATE_DONE); |
| coda_m2m_buf_done(ctx, dst_buf, err_mb ? VB2_BUF_STATE_ERROR : |
| VB2_BUF_STATE_DONE); |
| mutex_unlock(&ctx->wakeup_mutex); |
| |
| coda_dbg(1, ctx, "job finished: encoded frame (%u)%s\n", |
| dst_buf->sequence, |
| (dst_buf->flags & V4L2_BUF_FLAG_LAST) ? " (last)" : ""); |
| |
| /* |
| * Reset JPEG processing unit after each encode run to work |
| * around hangups when switching context between encoder and |
| * decoder. |
| */ |
| coda_hw_reset(ctx); |
| } |
| |
| static void coda9_jpeg_encode_timeout(struct coda_ctx *ctx) |
| { |
| struct coda_dev *dev = ctx->dev; |
| u32 end_addr, wr_ptr; |
| |
| /* Handle missing BBC overflow interrupt via timeout */ |
| end_addr = coda_read(dev, CODA9_REG_JPEG_BBC_END_ADDR); |
| wr_ptr = coda_read(dev, CODA9_REG_JPEG_BBC_WR_PTR); |
| if (wr_ptr >= end_addr - 256) { |
| v4l2_err(&dev->v4l2_dev, "JPEG too large for capture buffer\n"); |
| coda9_jpeg_finish_encode(ctx); |
| return; |
| } |
| |
| coda_hw_reset(ctx); |
| } |
| |
| static void coda9_jpeg_release(struct coda_ctx *ctx) |
| { |
| int i; |
| |
| if (ctx->params.jpeg_qmat_tab[0] == luma_q) |
| ctx->params.jpeg_qmat_tab[0] = NULL; |
| if (ctx->params.jpeg_qmat_tab[1] == chroma_q) |
| ctx->params.jpeg_qmat_tab[1] = NULL; |
| for (i = 0; i < 3; i++) |
| kfree(ctx->params.jpeg_qmat_tab[i]); |
| kfree(ctx->params.jpeg_huff_data); |
| kfree(ctx->params.jpeg_huff_tab); |
| } |
| |
| const struct coda_context_ops coda9_jpeg_encode_ops = { |
| .queue_init = coda_encoder_queue_init, |
| .start_streaming = coda9_jpeg_start_encoding, |
| .prepare_run = coda9_jpeg_prepare_encode, |
| .finish_run = coda9_jpeg_finish_encode, |
| .run_timeout = coda9_jpeg_encode_timeout, |
| .release = coda9_jpeg_release, |
| }; |
| |
| /* |
| * Decoder context operations |
| */ |
| |
| static int coda9_jpeg_start_decoding(struct coda_ctx *ctx) |
| { |
| ctx->params.jpeg_qmat_index[0] = 0; |
| ctx->params.jpeg_qmat_index[1] = 1; |
| ctx->params.jpeg_qmat_index[2] = 1; |
| ctx->params.jpeg_qmat_tab[0] = luma_q; |
| ctx->params.jpeg_qmat_tab[1] = chroma_q; |
| /* nothing more to do here */ |
| |
| /* TODO: we could already scan the first header to get the chroma |
| * format. |
| */ |
| |
| return 0; |
| } |
| |
| static int coda9_jpeg_prepare_decode(struct coda_ctx *ctx) |
| { |
| struct coda_dev *dev = ctx->dev; |
| int aligned_width, aligned_height; |
| int chroma_format; |
| int ret; |
| u32 val, dst_fourcc; |
| struct coda_q_data *q_data_src, *q_data_dst; |
| struct vb2_v4l2_buffer *src_buf, *dst_buf; |
| int chroma_interleave; |
| int scl_hor_mode, scl_ver_mode; |
| |
| src_buf = v4l2_m2m_next_src_buf(ctx->fh.m2m_ctx); |
| dst_buf = v4l2_m2m_next_dst_buf(ctx->fh.m2m_ctx); |
| q_data_src = get_q_data(ctx, V4L2_BUF_TYPE_VIDEO_OUTPUT); |
| q_data_dst = get_q_data(ctx, V4L2_BUF_TYPE_VIDEO_CAPTURE); |
| dst_fourcc = q_data_dst->fourcc; |
| |
| scl_hor_mode = coda_jpeg_scale(q_data_src->width, q_data_dst->width); |
| scl_ver_mode = coda_jpeg_scale(q_data_src->height, q_data_dst->height); |
| |
| if (vb2_get_plane_payload(&src_buf->vb2_buf, 0) == 0) |
| vb2_set_plane_payload(&src_buf->vb2_buf, 0, |
| vb2_plane_size(&src_buf->vb2_buf, 0)); |
| |
| chroma_format = coda9_jpeg_chroma_format(q_data_dst->fourcc); |
| if (chroma_format < 0) |
| return chroma_format; |
| |
| ret = coda_jpeg_decode_header(ctx, &src_buf->vb2_buf); |
| if (ret < 0) { |
| src_buf = v4l2_m2m_src_buf_remove(ctx->fh.m2m_ctx); |
| dst_buf = v4l2_m2m_dst_buf_remove(ctx->fh.m2m_ctx); |
| v4l2_m2m_buf_done(src_buf, VB2_BUF_STATE_DONE); |
| v4l2_m2m_buf_done(dst_buf, VB2_BUF_STATE_ERROR); |
| |
| return ret; |
| } |
| |
| /* Round image dimensions to multiple of MCU size */ |
| aligned_width = round_up(q_data_src->width, width_align[chroma_format]); |
| aligned_height = round_up(q_data_src->height, height_align[chroma_format]); |
| if (aligned_width != q_data_dst->bytesperline) { |
| v4l2_err(&dev->v4l2_dev, "stride mismatch: %d != %d\n", |
| aligned_width, q_data_dst->bytesperline); |
| } |
| |
| coda_set_gdi_regs(ctx); |
| |
| val = ctx->params.jpeg_huff_ac_index[0] << 12 | |
| ctx->params.jpeg_huff_ac_index[1] << 11 | |
| ctx->params.jpeg_huff_ac_index[2] << 10 | |
| ctx->params.jpeg_huff_dc_index[0] << 9 | |
| ctx->params.jpeg_huff_dc_index[1] << 8 | |
| ctx->params.jpeg_huff_dc_index[2] << 7; |
| if (ctx->params.jpeg_huff_tab) |
| val |= CODA9_JPEG_PIC_CTRL_USER_HUFFMAN_EN; |
| coda_write(dev, val, CODA9_REG_JPEG_PIC_CTRL); |
| |
| coda_write(dev, aligned_width << 16 | aligned_height, |
| CODA9_REG_JPEG_PIC_SIZE); |
| |
| chroma_interleave = (dst_fourcc == V4L2_PIX_FMT_NV12); |
| coda_write(dev, 0, CODA9_REG_JPEG_ROT_INFO); |
| coda_write(dev, bus_req_num[chroma_format], CODA9_REG_JPEG_OP_INFO); |
| coda_write(dev, mcu_info[chroma_format], CODA9_REG_JPEG_MCU_INFO); |
| if (scl_hor_mode || scl_ver_mode) |
| val = CODA9_JPEG_SCL_ENABLE | (scl_hor_mode << 2) | scl_ver_mode; |
| else |
| val = 0; |
| coda_write(dev, val, CODA9_REG_JPEG_SCL_INFO); |
| coda_write(dev, chroma_interleave, CODA9_REG_JPEG_DPB_CONFIG); |
| coda_write(dev, ctx->params.jpeg_restart_interval, |
| CODA9_REG_JPEG_RST_INTVAL); |
| |
| if (ctx->params.jpeg_huff_tab) { |
| ret = coda9_jpeg_dec_huff_setup(ctx); |
| if (ret < 0) { |
| v4l2_err(&dev->v4l2_dev, |
| "failed to set up Huffman tables: %d\n", ret); |
| return ret; |
| } |
| } |
| |
| coda9_jpeg_qmat_setup(ctx); |
| |
| coda9_jpeg_dec_bbc_gbu_setup(ctx, &src_buf->vb2_buf, |
| ctx->jpeg_ecs_offset); |
| |
| coda_write(dev, 0, CODA9_REG_JPEG_RST_INDEX); |
| coda_write(dev, 0, CODA9_REG_JPEG_RST_COUNT); |
| |
| coda_write(dev, 0, CODA9_REG_JPEG_DPCM_DIFF_Y); |
| coda_write(dev, 0, CODA9_REG_JPEG_DPCM_DIFF_CB); |
| coda_write(dev, 0, CODA9_REG_JPEG_DPCM_DIFF_CR); |
| |
| coda_write(dev, 0, CODA9_REG_JPEG_ROT_INFO); |
| |
| coda_write(dev, 1, CODA9_GDI_CONTROL); |
| do { |
| ret = coda_read(dev, CODA9_GDI_STATUS); |
| } while (!ret); |
| |
| val = (chroma_format << 17) | (chroma_interleave << 16) | |
| q_data_dst->bytesperline; |
| if (ctx->tiled_map_type == GDI_TILED_FRAME_MB_RASTER_MAP) |
| val |= 3 << 20; |
| coda_write(dev, val, CODA9_GDI_INFO_CONTROL); |
| |
| coda_write(dev, aligned_width << 16 | aligned_height, |
| CODA9_GDI_INFO_PIC_SIZE); |
| |
| coda_write_base(ctx, q_data_dst, dst_buf, CODA9_GDI_INFO_BASE_Y); |
| |
| coda_write(dev, 0, CODA9_REG_JPEG_DPB_BASE00); |
| coda_write(dev, 0, CODA9_GDI_CONTROL); |
| coda_write(dev, 1, CODA9_GDI_PIC_INIT_HOST); |
| |
| trace_coda_jpeg_run(ctx, src_buf); |
| |
| coda_write(dev, 1, CODA9_REG_JPEG_PIC_START); |
| |
| return 0; |
| } |
| |
| static void coda9_jpeg_finish_decode(struct coda_ctx *ctx) |
| { |
| struct coda_dev *dev = ctx->dev; |
| struct vb2_v4l2_buffer *dst_buf, *src_buf; |
| struct coda_q_data *q_data_dst; |
| u32 err_mb; |
| |
| err_mb = coda_read(dev, CODA9_REG_JPEG_PIC_ERRMB); |
| if (err_mb) |
| v4l2_err(&dev->v4l2_dev, "ERRMB: 0x%x\n", err_mb); |
| |
| coda_write(dev, 0, CODA9_REG_JPEG_BBC_FLUSH_CMD); |
| |
| /* |
| * Lock to make sure that a decoder stop command running in parallel |
| * will either already have marked src_buf as last, or it will wake up |
| * the capture queue after the buffers are returned. |
| */ |
| mutex_lock(&ctx->wakeup_mutex); |
| src_buf = v4l2_m2m_src_buf_remove(ctx->fh.m2m_ctx); |
| dst_buf = v4l2_m2m_dst_buf_remove(ctx->fh.m2m_ctx); |
| dst_buf->sequence = ctx->osequence++; |
| |
| trace_coda_jpeg_done(ctx, dst_buf); |
| |
| dst_buf->flags &= ~(V4L2_BUF_FLAG_PFRAME | V4L2_BUF_FLAG_LAST); |
| dst_buf->flags |= V4L2_BUF_FLAG_KEYFRAME; |
| dst_buf->flags |= src_buf->flags & V4L2_BUF_FLAG_LAST; |
| |
| v4l2_m2m_buf_copy_metadata(src_buf, dst_buf, false); |
| |
| q_data_dst = get_q_data(ctx, V4L2_BUF_TYPE_VIDEO_CAPTURE); |
| vb2_set_plane_payload(&dst_buf->vb2_buf, 0, q_data_dst->sizeimage); |
| |
| v4l2_m2m_buf_done(src_buf, VB2_BUF_STATE_DONE); |
| coda_m2m_buf_done(ctx, dst_buf, err_mb ? VB2_BUF_STATE_ERROR : |
| VB2_BUF_STATE_DONE); |
| |
| mutex_unlock(&ctx->wakeup_mutex); |
| |
| coda_dbg(1, ctx, "job finished: decoded frame (%u)%s\n", |
| dst_buf->sequence, |
| (dst_buf->flags & V4L2_BUF_FLAG_LAST) ? " (last)" : ""); |
| |
| /* |
| * Reset JPEG processing unit after each decode run to work |
| * around hangups when switching context between encoder and |
| * decoder. |
| */ |
| coda_hw_reset(ctx); |
| } |
| |
| const struct coda_context_ops coda9_jpeg_decode_ops = { |
| .queue_init = coda_encoder_queue_init, /* non-bitstream operation */ |
| .start_streaming = coda9_jpeg_start_decoding, |
| .prepare_run = coda9_jpeg_prepare_decode, |
| .finish_run = coda9_jpeg_finish_decode, |
| .release = coda9_jpeg_release, |
| }; |
| |
| irqreturn_t coda9_jpeg_irq_handler(int irq, void *data) |
| { |
| struct coda_dev *dev = data; |
| struct coda_ctx *ctx; |
| int status; |
| int err_mb; |
| |
| status = coda_read(dev, CODA9_REG_JPEG_PIC_STATUS); |
| if (status == 0) |
| return IRQ_HANDLED; |
| coda_write(dev, status, CODA9_REG_JPEG_PIC_STATUS); |
| |
| if (status & CODA9_JPEG_STATUS_OVERFLOW) |
| v4l2_err(&dev->v4l2_dev, "JPEG overflow\n"); |
| |
| if (status & CODA9_JPEG_STATUS_BBC_INT) |
| v4l2_err(&dev->v4l2_dev, "JPEG BBC interrupt\n"); |
| |
| if (status & CODA9_JPEG_STATUS_ERROR) { |
| v4l2_err(&dev->v4l2_dev, "JPEG error\n"); |
| |
| err_mb = coda_read(dev, CODA9_REG_JPEG_PIC_ERRMB); |
| if (err_mb) { |
| v4l2_err(&dev->v4l2_dev, |
| "ERRMB: 0x%x: rst idx %d, mcu pos (%d,%d)\n", |
| err_mb, err_mb >> 24, (err_mb >> 12) & 0xfff, |
| err_mb & 0xfff); |
| } |
| } |
| |
| ctx = v4l2_m2m_get_curr_priv(dev->m2m_dev); |
| if (!ctx) { |
| v4l2_err(&dev->v4l2_dev, |
| "Instance released before the end of transaction\n"); |
| mutex_unlock(&dev->coda_mutex); |
| return IRQ_HANDLED; |
| } |
| |
| complete(&ctx->completion); |
| |
| return IRQ_HANDLED; |
| } |