diff options
Diffstat (limited to 'drivers/media/platform/sh_veu.c')
| -rw-r--r-- | drivers/media/platform/sh_veu.c | 1250 | 
1 files changed, 1250 insertions, 0 deletions
diff --git a/drivers/media/platform/sh_veu.c b/drivers/media/platform/sh_veu.c new file mode 100644 index 00000000000..744e43b480b --- /dev/null +++ b/drivers/media/platform/sh_veu.c @@ -0,0 +1,1250 @@ +/* + * sh-mobile VEU mem2mem driver + * + * Copyright (C) 2012 Renesas Electronics Corporation + * Author: Guennadi Liakhovetski, <g.liakhovetski@gmx.de> + * Copyright (C) 2008 Magnus Damm + * + * This program is free software; you can redistribute it and/or modify + * it under the terms of the version 2 of the GNU General Public License as + * published by the Free Software Foundation + */ + +#include <linux/err.h> +#include <linux/fs.h> +#include <linux/kernel.h> +#include <linux/module.h> +#include <linux/interrupt.h> +#include <linux/io.h> +#include <linux/platform_device.h> +#include <linux/pm_runtime.h> +#include <linux/slab.h> +#include <linux/types.h> +#include <linux/videodev2.h> + +#include <media/v4l2-dev.h> +#include <media/v4l2-device.h> +#include <media/v4l2-ioctl.h> +#include <media/v4l2-mem2mem.h> +#include <media/videobuf2-dma-contig.h> + +#define VEU_STR 0x00 /* start register */ +#define VEU_SWR 0x10 /* src: line length */ +#define VEU_SSR 0x14 /* src: image size */ +#define VEU_SAYR 0x18 /* src: y/rgb plane address */ +#define VEU_SACR 0x1c /* src: c plane address */ +#define VEU_BSSR 0x20 /* bundle mode register */ +#define VEU_EDWR 0x30 /* dst: line length */ +#define VEU_DAYR 0x34 /* dst: y/rgb plane address */ +#define VEU_DACR 0x38 /* dst: c plane address */ +#define VEU_TRCR 0x50 /* transform control */ +#define VEU_RFCR 0x54 /* resize scale */ +#define VEU_RFSR 0x58 /* resize clip */ +#define VEU_ENHR 0x5c /* enhance */ +#define VEU_FMCR 0x70 /* filter mode */ +#define VEU_VTCR 0x74 /* lowpass vertical */ +#define VEU_HTCR 0x78 /* lowpass horizontal */ +#define VEU_APCR 0x80 /* color match */ +#define VEU_ECCR 0x84 /* color replace */ +#define VEU_AFXR 0x90 /* fixed mode */ +#define VEU_SWPR 0x94 /* swap */ +#define VEU_EIER 0xa0 /* interrupt mask */ +#define VEU_EVTR 0xa4 /* interrupt event */ +#define VEU_STAR 0xb0 /* status */ +#define VEU_BSRR 0xb4 /* reset */ + +#define VEU_MCR00 0x200 /* color conversion matrix coefficient 00 */ +#define VEU_MCR01 0x204 /* color conversion matrix coefficient 01 */ +#define VEU_MCR02 0x208 /* color conversion matrix coefficient 02 */ +#define VEU_MCR10 0x20c /* color conversion matrix coefficient 10 */ +#define VEU_MCR11 0x210 /* color conversion matrix coefficient 11 */ +#define VEU_MCR12 0x214 /* color conversion matrix coefficient 12 */ +#define VEU_MCR20 0x218 /* color conversion matrix coefficient 20 */ +#define VEU_MCR21 0x21c /* color conversion matrix coefficient 21 */ +#define VEU_MCR22 0x220 /* color conversion matrix coefficient 22 */ +#define VEU_COFFR 0x224 /* color conversion offset */ +#define VEU_CBR   0x228 /* color conversion clip */ + +/* + * 4092x4092 max size is the normal case. In some cases it can be reduced to + * 2048x2048, in other cases it can be 4092x8188 or even 8188x8188. + */ +#define MAX_W 4092 +#define MAX_H 4092 +#define MIN_W 8 +#define MIN_H 8 +#define ALIGN_W 4 + +/* 3 buffers of 2048 x 1536 - 3 megapixels @ 16bpp */ +#define VIDEO_MEM_LIMIT ALIGN(2048 * 1536 * 2 * 3, 1024 * 1024) + +#define MEM2MEM_DEF_TRANSLEN 1 + +struct sh_veu_dev; + +struct sh_veu_file { +	struct sh_veu_dev *veu_dev; +	bool cfg_needed; +}; + +struct sh_veu_format { +	char *name; +	u32 fourcc; +	unsigned int depth; +	unsigned int ydepth; +}; + +/* video data format */ +struct sh_veu_vfmt { +	/* Replace with v4l2_rect */ +	struct v4l2_rect		frame; +	unsigned int			bytesperline; +	unsigned int			offset_y; +	unsigned int			offset_c; +	const struct sh_veu_format	*fmt; +}; + +struct sh_veu_dev { +	struct v4l2_device v4l2_dev; +	struct video_device vdev; +	struct v4l2_m2m_dev *m2m_dev; +	struct device *dev; +	struct v4l2_m2m_ctx *m2m_ctx; +	struct sh_veu_vfmt vfmt_out; +	struct sh_veu_vfmt vfmt_in; +	/* Only single user per direction so far */ +	struct sh_veu_file *capture; +	struct sh_veu_file *output; +	struct mutex fop_lock; +	void __iomem *base; +	struct vb2_alloc_ctx *alloc_ctx; +	spinlock_t lock; +	bool is_2h; +	unsigned int xaction; +	bool aborting; +}; + +enum sh_veu_fmt_idx { +	SH_VEU_FMT_NV12, +	SH_VEU_FMT_NV16, +	SH_VEU_FMT_NV24, +	SH_VEU_FMT_RGB332, +	SH_VEU_FMT_RGB444, +	SH_VEU_FMT_RGB565, +	SH_VEU_FMT_RGB666, +	SH_VEU_FMT_RGB24, +}; + +#define VGA_WIDTH	640 +#define VGA_HEIGHT	480 + +#define DEFAULT_IN_WIDTH	VGA_WIDTH +#define DEFAULT_IN_HEIGHT	VGA_HEIGHT +#define DEFAULT_IN_FMTIDX	SH_VEU_FMT_NV12 +#define DEFAULT_OUT_WIDTH	VGA_WIDTH +#define DEFAULT_OUT_HEIGHT	VGA_HEIGHT +#define DEFAULT_OUT_FMTIDX	SH_VEU_FMT_RGB565 + +/* + * Alignment: Y-plane should be 4-byte aligned for NV12 and NV16, and 8-byte + * aligned for NV24. + */ +static const struct sh_veu_format sh_veu_fmt[] = { +	[SH_VEU_FMT_NV12]   = { .ydepth = 8, .depth = 12, .name = "NV12", .fourcc = V4L2_PIX_FMT_NV12 }, +	[SH_VEU_FMT_NV16]   = { .ydepth = 8, .depth = 16, .name = "NV16", .fourcc = V4L2_PIX_FMT_NV16 }, +	[SH_VEU_FMT_NV24]   = { .ydepth = 8, .depth = 24, .name = "NV24", .fourcc = V4L2_PIX_FMT_NV24 }, +	[SH_VEU_FMT_RGB332] = { .ydepth = 8, .depth = 8, .name = "RGB332", .fourcc = V4L2_PIX_FMT_RGB332 }, +	[SH_VEU_FMT_RGB444] = { .ydepth = 16, .depth = 16, .name = "RGB444", .fourcc = V4L2_PIX_FMT_RGB444 }, +	[SH_VEU_FMT_RGB565] = { .ydepth = 16, .depth = 16, .name = "RGB565", .fourcc = V4L2_PIX_FMT_RGB565 }, +	[SH_VEU_FMT_RGB666] = { .ydepth = 32, .depth = 32, .name = "BGR666", .fourcc = V4L2_PIX_FMT_BGR666 }, +	[SH_VEU_FMT_RGB24]  = { .ydepth = 24, .depth = 24, .name = "RGB24", .fourcc = V4L2_PIX_FMT_RGB24 }, +}; + +#define DEFAULT_IN_VFMT (struct sh_veu_vfmt){						\ +	.frame = {									\ +		.width = VGA_WIDTH,							\ +		.height = VGA_HEIGHT,							\ +	},										\ +	.bytesperline = (VGA_WIDTH * sh_veu_fmt[DEFAULT_IN_FMTIDX].ydepth) >> 3,	\ +	.fmt = &sh_veu_fmt[DEFAULT_IN_FMTIDX],						\ +} + +#define DEFAULT_OUT_VFMT (struct sh_veu_vfmt){						\ +	.frame = {									\ +		.width = VGA_WIDTH,							\ +		.height = VGA_HEIGHT,							\ +	},										\ +	.bytesperline = (VGA_WIDTH * sh_veu_fmt[DEFAULT_OUT_FMTIDX].ydepth) >> 3,	\ +	.fmt = &sh_veu_fmt[DEFAULT_OUT_FMTIDX],						\ +} + +/* + * TODO: add support for further output formats: + *	SH_VEU_FMT_NV12, + *	SH_VEU_FMT_NV16, + *	SH_VEU_FMT_NV24, + *	SH_VEU_FMT_RGB332, + *	SH_VEU_FMT_RGB444, + *	SH_VEU_FMT_RGB666, + *	SH_VEU_FMT_RGB24, + */ + +static const int sh_veu_fmt_out[] = { +	SH_VEU_FMT_RGB565, +}; + +/* + * TODO: add support for further input formats: + *	SH_VEU_FMT_NV16, + *	SH_VEU_FMT_NV24, + *	SH_VEU_FMT_RGB565, + *	SH_VEU_FMT_RGB666, + *	SH_VEU_FMT_RGB24, + */ +static const int sh_veu_fmt_in[] = { +	SH_VEU_FMT_NV12, +}; + +static enum v4l2_colorspace sh_veu_4cc2cspace(u32 fourcc) +{ +	switch (fourcc) { +	default: +		BUG(); +	case V4L2_PIX_FMT_NV12: +	case V4L2_PIX_FMT_NV16: +	case V4L2_PIX_FMT_NV24: +		return V4L2_COLORSPACE_JPEG; +	case V4L2_PIX_FMT_RGB332: +	case V4L2_PIX_FMT_RGB444: +	case V4L2_PIX_FMT_RGB565: +	case V4L2_PIX_FMT_BGR666: +	case V4L2_PIX_FMT_RGB24: +		return V4L2_COLORSPACE_SRGB; +	} +} + +static u32 sh_veu_reg_read(struct sh_veu_dev *veu, unsigned int reg) +{ +	return ioread32(veu->base + reg); +} + +static void sh_veu_reg_write(struct sh_veu_dev *veu, unsigned int reg, +			     u32 value) +{ +	iowrite32(value, veu->base + reg); +} + +		/* ========== mem2mem callbacks ========== */ + +static void sh_veu_job_abort(void *priv) +{ +	struct sh_veu_dev *veu = priv; + +	/* Will cancel the transaction in the next interrupt handler */ +	veu->aborting = true; +} + +static void sh_veu_lock(void *priv) +{ +	struct sh_veu_dev *veu = priv; + +	mutex_lock(&veu->fop_lock); +} + +static void sh_veu_unlock(void *priv) +{ +	struct sh_veu_dev *veu = priv; + +	mutex_unlock(&veu->fop_lock); +} + +static void sh_veu_process(struct sh_veu_dev *veu, +			   struct vb2_buffer *src_buf, +			   struct vb2_buffer *dst_buf) +{ +	dma_addr_t addr = vb2_dma_contig_plane_dma_addr(dst_buf, 0); + +	sh_veu_reg_write(veu, VEU_DAYR, addr + veu->vfmt_out.offset_y); +	sh_veu_reg_write(veu, VEU_DACR, veu->vfmt_out.offset_c ? +			 addr + veu->vfmt_out.offset_c : 0); +	dev_dbg(veu->dev, "%s(): dst base %lx, y: %x, c: %x\n", __func__, +		(unsigned long)addr, +		veu->vfmt_out.offset_y, veu->vfmt_out.offset_c); + +	addr = vb2_dma_contig_plane_dma_addr(src_buf, 0); +	sh_veu_reg_write(veu, VEU_SAYR, addr + veu->vfmt_in.offset_y); +	sh_veu_reg_write(veu, VEU_SACR, veu->vfmt_in.offset_c ? +			 addr + veu->vfmt_in.offset_c : 0); +	dev_dbg(veu->dev, "%s(): src base %lx, y: %x, c: %x\n", __func__, +		(unsigned long)addr, +		veu->vfmt_in.offset_y, veu->vfmt_in.offset_c); + +	sh_veu_reg_write(veu, VEU_STR, 1); + +	sh_veu_reg_write(veu, VEU_EIER, 1); /* enable interrupt in VEU */ +} + +/** + * sh_veu_device_run() - prepares and starts the device + * + * This will be called by the framework when it decides to schedule a particular + * instance. + */ +static void sh_veu_device_run(void *priv) +{ +	struct sh_veu_dev *veu = priv; +	struct vb2_buffer *src_buf, *dst_buf; + +	src_buf = v4l2_m2m_next_src_buf(veu->m2m_ctx); +	dst_buf = v4l2_m2m_next_dst_buf(veu->m2m_ctx); + +	if (src_buf && dst_buf) +		sh_veu_process(veu, src_buf, dst_buf); +} + +		/* ========== video ioctls ========== */ + +static bool sh_veu_is_streamer(struct sh_veu_dev *veu, struct sh_veu_file *veu_file, +			       enum v4l2_buf_type type) +{ +	return (type == V4L2_BUF_TYPE_VIDEO_CAPTURE && +		veu_file == veu->capture) || +		(type == V4L2_BUF_TYPE_VIDEO_OUTPUT && +		 veu_file == veu->output); +} + +static int sh_veu_queue_init(void *priv, struct vb2_queue *src_vq, +			     struct vb2_queue *dst_vq); + +/* + * It is not unusual to have video nodes open()ed multiple times. While some + * V4L2 operations are non-intrusive, like querying formats and various + * parameters, others, like setting formats, starting and stopping streaming, + * queuing and dequeuing buffers, directly affect hardware configuration and / + * or execution. This function verifies availability of the requested interface + * and, if available, reserves it for the requesting user. + */ +static int sh_veu_stream_init(struct sh_veu_dev *veu, struct sh_veu_file *veu_file, +			      enum v4l2_buf_type type) +{ +	struct sh_veu_file **stream; + +	switch (type) { +	case V4L2_BUF_TYPE_VIDEO_CAPTURE: +		stream = &veu->capture; +		break; +	case V4L2_BUF_TYPE_VIDEO_OUTPUT: +		stream = &veu->output; +		break; +	default: +		return -EINVAL; +	} + +	if (*stream == veu_file) +		return 0; + +	if (*stream) +		return -EBUSY; + +	*stream = veu_file; + +	return 0; +} + +static int sh_veu_context_init(struct sh_veu_dev *veu) +{ +	if (veu->m2m_ctx) +		return 0; + +	veu->m2m_ctx = v4l2_m2m_ctx_init(veu->m2m_dev, veu, +					 sh_veu_queue_init); + +	return PTR_ERR_OR_ZERO(veu->m2m_ctx); +} + +static int sh_veu_querycap(struct file *file, void *priv, +			   struct v4l2_capability *cap) +{ +	strlcpy(cap->driver, "sh-veu", sizeof(cap->driver)); +	strlcpy(cap->card, "sh-mobile VEU", sizeof(cap->card)); +	strlcpy(cap->bus_info, "platform:sh-veu", sizeof(cap->bus_info)); +	cap->device_caps = V4L2_CAP_VIDEO_M2M | V4L2_CAP_STREAMING; +	cap->capabilities = cap->device_caps | V4L2_CAP_DEVICE_CAPS; + +	return 0; +} + +static int sh_veu_enum_fmt(struct v4l2_fmtdesc *f, const int *fmt, int fmt_num) +{ +	if (f->index >= fmt_num) +		return -EINVAL; + +	strlcpy(f->description, sh_veu_fmt[fmt[f->index]].name, sizeof(f->description)); +	f->pixelformat = sh_veu_fmt[fmt[f->index]].fourcc; +	return 0; +} + +static int sh_veu_enum_fmt_vid_cap(struct file *file, void *priv, +				   struct v4l2_fmtdesc *f) +{ +	return sh_veu_enum_fmt(f, sh_veu_fmt_out, ARRAY_SIZE(sh_veu_fmt_out)); +} + +static int sh_veu_enum_fmt_vid_out(struct file *file, void *priv, +				   struct v4l2_fmtdesc *f) +{ +	return sh_veu_enum_fmt(f, sh_veu_fmt_in, ARRAY_SIZE(sh_veu_fmt_in)); +} + +static struct sh_veu_vfmt *sh_veu_get_vfmt(struct sh_veu_dev *veu, +					   enum v4l2_buf_type type) +{ +	switch (type) { +	case V4L2_BUF_TYPE_VIDEO_CAPTURE: +		return &veu->vfmt_out; +	case V4L2_BUF_TYPE_VIDEO_OUTPUT: +		return &veu->vfmt_in; +	default: +		return NULL; +	} +} + +static int sh_veu_g_fmt(struct sh_veu_file *veu_file, struct v4l2_format *f) +{ +	struct v4l2_pix_format *pix = &f->fmt.pix; +	struct sh_veu_dev *veu = veu_file->veu_dev; +	struct sh_veu_vfmt *vfmt; + +	vfmt = sh_veu_get_vfmt(veu, f->type); + +	pix->width		= vfmt->frame.width; +	pix->height		= vfmt->frame.height; +	pix->field		= V4L2_FIELD_NONE; +	pix->pixelformat	= vfmt->fmt->fourcc; +	pix->colorspace		= sh_veu_4cc2cspace(pix->pixelformat); +	pix->bytesperline	= vfmt->bytesperline; +	pix->sizeimage		= vfmt->bytesperline * pix->height * +		vfmt->fmt->depth / vfmt->fmt->ydepth; +	pix->priv		= 0; +	dev_dbg(veu->dev, "%s(): type: %d, size %u @ %ux%u, fmt %x\n", __func__, +		f->type, pix->sizeimage, pix->width, pix->height, pix->pixelformat); + +	return 0; +} + +static int sh_veu_g_fmt_vid_out(struct file *file, void *priv, +				struct v4l2_format *f) +{ +	return sh_veu_g_fmt(priv, f); +} + +static int sh_veu_g_fmt_vid_cap(struct file *file, void *priv, +				struct v4l2_format *f) +{ +	return sh_veu_g_fmt(priv, f); +} + +static int sh_veu_try_fmt(struct v4l2_format *f, const struct sh_veu_format *fmt) +{ +	struct v4l2_pix_format *pix = &f->fmt.pix; +	unsigned int y_bytes_used; + +	/* +	 * V4L2 specification suggests, that the driver should correct the +	 * format struct if any of the dimensions is unsupported +	 */ +	switch (pix->field) { +	default: +	case V4L2_FIELD_ANY: +		pix->field = V4L2_FIELD_NONE; +		/* fall through: continue handling V4L2_FIELD_NONE */ +	case V4L2_FIELD_NONE: +		break; +	} + +	v4l_bound_align_image(&pix->width, MIN_W, MAX_W, ALIGN_W, +			      &pix->height, MIN_H, MAX_H, 0, 0); + +	y_bytes_used = (pix->width * fmt->ydepth) >> 3; + +	if (pix->bytesperline < y_bytes_used) +		pix->bytesperline = y_bytes_used; +	pix->sizeimage = pix->height * pix->bytesperline * fmt->depth / fmt->ydepth; + +	pix->pixelformat	= fmt->fourcc; +	pix->colorspace		= sh_veu_4cc2cspace(pix->pixelformat); +	pix->priv		= 0; + +	pr_debug("%s(): type: %d, size %u\n", __func__, f->type, pix->sizeimage); + +	return 0; +} + +static const struct sh_veu_format *sh_veu_find_fmt(const struct v4l2_format *f) +{ +	const int *fmt; +	int i, n, dflt; + +	pr_debug("%s(%d;%d)\n", __func__, f->type, f->fmt.pix.field); + +	switch (f->type) { +	case V4L2_BUF_TYPE_VIDEO_CAPTURE: +		fmt = sh_veu_fmt_out; +		n = ARRAY_SIZE(sh_veu_fmt_out); +		dflt = DEFAULT_OUT_FMTIDX; +		break; +	case V4L2_BUF_TYPE_VIDEO_OUTPUT: +	default: +		fmt = sh_veu_fmt_in; +		n = ARRAY_SIZE(sh_veu_fmt_in); +		dflt = DEFAULT_IN_FMTIDX; +		break; +	} + +	for (i = 0; i < n; i++) +		if (sh_veu_fmt[fmt[i]].fourcc == f->fmt.pix.pixelformat) +			return &sh_veu_fmt[fmt[i]]; + +	return &sh_veu_fmt[dflt]; +} + +static int sh_veu_try_fmt_vid_cap(struct file *file, void *priv, +				  struct v4l2_format *f) +{ +	const struct sh_veu_format *fmt; + +	fmt = sh_veu_find_fmt(f); +	if (!fmt) +		/* wrong buffer type */ +		return -EINVAL; + +	return sh_veu_try_fmt(f, fmt); +} + +static int sh_veu_try_fmt_vid_out(struct file *file, void *priv, +				  struct v4l2_format *f) +{ +	const struct sh_veu_format *fmt; + +	fmt = sh_veu_find_fmt(f); +	if (!fmt) +		/* wrong buffer type */ +		return -EINVAL; + +	return sh_veu_try_fmt(f, fmt); +} + +static void sh_veu_colour_offset(struct sh_veu_dev *veu, struct sh_veu_vfmt *vfmt) +{ +	/* dst_left and dst_top validity will be verified in CROP / COMPOSE */ +	unsigned int left = vfmt->frame.left & ~0x03; +	unsigned int top = vfmt->frame.top; +	dma_addr_t offset = ((left * veu->vfmt_out.fmt->depth) >> 3) + +		top * veu->vfmt_out.bytesperline; +	unsigned int y_line; + +	vfmt->offset_y = offset; + +	switch (vfmt->fmt->fourcc) { +	case V4L2_PIX_FMT_NV12: +	case V4L2_PIX_FMT_NV16: +	case V4L2_PIX_FMT_NV24: +		y_line = ALIGN(vfmt->frame.width, 16); +		vfmt->offset_c = offset + y_line * vfmt->frame.height; +		break; +	case V4L2_PIX_FMT_RGB332: +	case V4L2_PIX_FMT_RGB444: +	case V4L2_PIX_FMT_RGB565: +	case V4L2_PIX_FMT_BGR666: +	case V4L2_PIX_FMT_RGB24: +		vfmt->offset_c = 0; +		break; +	default: +		BUG(); +	} +} + +static int sh_veu_s_fmt(struct sh_veu_file *veu_file, struct v4l2_format *f) +{ +	struct v4l2_pix_format *pix = &f->fmt.pix; +	struct sh_veu_dev *veu = veu_file->veu_dev; +	struct sh_veu_vfmt *vfmt; +	struct vb2_queue *vq; +	int ret = sh_veu_context_init(veu); +	if (ret < 0) +		return ret; + +	vq = v4l2_m2m_get_vq(veu->m2m_ctx, f->type); +	if (!vq) +		return -EINVAL; + +	if (vb2_is_busy(vq)) { +		v4l2_err(&veu_file->veu_dev->v4l2_dev, "%s queue busy\n", __func__); +		return -EBUSY; +	} + +	vfmt = sh_veu_get_vfmt(veu, f->type); +	/* called after try_fmt(), hence vfmt != NULL. Implicit BUG_ON() below */ + +	vfmt->fmt		= sh_veu_find_fmt(f); +	/* vfmt->fmt != NULL following the same argument as above */ +	vfmt->frame.width	= pix->width; +	vfmt->frame.height	= pix->height; +	vfmt->bytesperline	= pix->bytesperline; + +	sh_veu_colour_offset(veu, vfmt); + +	/* +	 * We could also verify and require configuration only if any parameters +	 * actually have changed, but it is unlikely, that the user requests the +	 * same configuration several times without closing the device. +	 */ +	veu_file->cfg_needed = true; + +	dev_dbg(veu->dev, +		"Setting format for type %d, wxh: %dx%d, fmt: %x\n", +		f->type, pix->width, pix->height, vfmt->fmt->fourcc); + +	return 0; +} + +static int sh_veu_s_fmt_vid_cap(struct file *file, void *priv, +				struct v4l2_format *f) +{ +	int ret = sh_veu_try_fmt_vid_cap(file, priv, f); +	if (ret) +		return ret; + +	return sh_veu_s_fmt(priv, f); +} + +static int sh_veu_s_fmt_vid_out(struct file *file, void *priv, +				struct v4l2_format *f) +{ +	int ret = sh_veu_try_fmt_vid_out(file, priv, f); +	if (ret) +		return ret; + +	return sh_veu_s_fmt(priv, f); +} + +static int sh_veu_reqbufs(struct file *file, void *priv, +			  struct v4l2_requestbuffers *reqbufs) +{ +	struct sh_veu_file *veu_file = priv; +	struct sh_veu_dev *veu = veu_file->veu_dev; +	int ret = sh_veu_context_init(veu); +	if (ret < 0) +		return ret; + +	ret = sh_veu_stream_init(veu, veu_file, reqbufs->type); +	if (ret < 0) +		return ret; + +	return v4l2_m2m_reqbufs(file, veu->m2m_ctx, reqbufs); +} + +static int sh_veu_querybuf(struct file *file, void *priv, +			   struct v4l2_buffer *buf) +{ +	struct sh_veu_file *veu_file = priv; + +	if (!sh_veu_is_streamer(veu_file->veu_dev, veu_file, buf->type)) +		return -EBUSY; + +	return v4l2_m2m_querybuf(file, veu_file->veu_dev->m2m_ctx, buf); +} + +static int sh_veu_qbuf(struct file *file, void *priv, struct v4l2_buffer *buf) +{ +	struct sh_veu_file *veu_file = priv; + +	dev_dbg(veu_file->veu_dev->dev, "%s(%d)\n", __func__, buf->type); +	if (!sh_veu_is_streamer(veu_file->veu_dev, veu_file, buf->type)) +		return -EBUSY; + +	return v4l2_m2m_qbuf(file, veu_file->veu_dev->m2m_ctx, buf); +} + +static int sh_veu_dqbuf(struct file *file, void *priv, struct v4l2_buffer *buf) +{ +	struct sh_veu_file *veu_file = priv; + +	dev_dbg(veu_file->veu_dev->dev, "%s(%d)\n", __func__, buf->type); +	if (!sh_veu_is_streamer(veu_file->veu_dev, veu_file, buf->type)) +		return -EBUSY; + +	return v4l2_m2m_dqbuf(file, veu_file->veu_dev->m2m_ctx, buf); +} + +static void sh_veu_calc_scale(struct sh_veu_dev *veu, +			      int size_in, int size_out, int crop_out, +			      u32 *mant, u32 *frac, u32 *rep) +{ +	u32 fixpoint; + +	/* calculate FRAC and MANT */ +	*rep = *mant = *frac = 0; + +	if (size_in == size_out) { +		if (crop_out != size_out) +			*mant = 1; /* needed for cropping */ +		return; +	} + +	/* VEU2H special upscale */ +	if (veu->is_2h && size_out > size_in) { +		u32 fixpoint = (4096 * size_in) / size_out; +		*mant = fixpoint / 4096; +		*frac = (fixpoint - (*mant * 4096)) & ~0x07; + +		switch (*frac) { +		case 0x800: +			*rep = 1; +			break; +		case 0x400: +			*rep = 3; +			break; +		case 0x200: +			*rep = 7; +			break; +		} +		if (*rep) +			return; +	} + +	fixpoint = (4096 * (size_in - 1)) / (size_out + 1); +	*mant = fixpoint / 4096; +	*frac = fixpoint - (*mant * 4096); + +	if (*frac & 0x07) { +		/* +		 * FIXME: do we really have to round down twice in the +		 * up-scaling case? +		 */ +		*frac &= ~0x07; +		if (size_out > size_in) +			*frac -= 8; /* round down if scaling up */ +		else +			*frac += 8; /* round up if scaling down */ +	} +} + +static unsigned long sh_veu_scale_v(struct sh_veu_dev *veu, +				    int size_in, int size_out, int crop_out) +{ +	u32 mant, frac, value, rep; + +	sh_veu_calc_scale(veu, size_in, size_out, crop_out, &mant, &frac, &rep); + +	/* set scale */ +	value = (sh_veu_reg_read(veu, VEU_RFCR) & ~0xffff0000) | +		(((mant << 12) | frac) << 16); + +	sh_veu_reg_write(veu, VEU_RFCR, value); + +	/* set clip */ +	value = (sh_veu_reg_read(veu, VEU_RFSR) & ~0xffff0000) | +		(((rep << 12) | crop_out) << 16); + +	sh_veu_reg_write(veu, VEU_RFSR, value); + +	return ALIGN((size_in * crop_out) / size_out, 4); +} + +static unsigned long sh_veu_scale_h(struct sh_veu_dev *veu, +				    int size_in, int size_out, int crop_out) +{ +	u32 mant, frac, value, rep; + +	sh_veu_calc_scale(veu, size_in, size_out, crop_out, &mant, &frac, &rep); + +	/* set scale */ +	value = (sh_veu_reg_read(veu, VEU_RFCR) & ~0xffff) | +		(mant << 12) | frac; + +	sh_veu_reg_write(veu, VEU_RFCR, value); + +	/* set clip */ +	value = (sh_veu_reg_read(veu, VEU_RFSR) & ~0xffff) | +		(rep << 12) | crop_out; + +	sh_veu_reg_write(veu, VEU_RFSR, value); + +	return ALIGN((size_in * crop_out) / size_out, 4); +} + +static void sh_veu_configure(struct sh_veu_dev *veu) +{ +	u32 src_width, src_stride, src_height; +	u32 dst_width, dst_stride, dst_height; +	u32 real_w, real_h; + +	/* reset VEU */ +	sh_veu_reg_write(veu, VEU_BSRR, 0x100); + +	src_width = veu->vfmt_in.frame.width; +	src_height = veu->vfmt_in.frame.height; +	src_stride = ALIGN(veu->vfmt_in.frame.width, 16); + +	dst_width = real_w = veu->vfmt_out.frame.width; +	dst_height = real_h = veu->vfmt_out.frame.height; +	/* Datasheet is unclear - whether it's always number of bytes or not */ +	dst_stride = veu->vfmt_out.bytesperline; + +	/* +	 * So far real_w == dst_width && real_h == dst_height, but it wasn't +	 * necessarily the case in the original vidix driver, so, it may change +	 * here in the future too. +	 */ +	src_width = sh_veu_scale_h(veu, src_width, real_w, dst_width); +	src_height = sh_veu_scale_v(veu, src_height, real_h, dst_height); + +	sh_veu_reg_write(veu, VEU_SWR, src_stride); +	sh_veu_reg_write(veu, VEU_SSR, src_width | (src_height << 16)); +	sh_veu_reg_write(veu, VEU_BSSR, 0); /* not using bundle mode */ + +	sh_veu_reg_write(veu, VEU_EDWR, dst_stride); +	sh_veu_reg_write(veu, VEU_DACR, 0); /* unused for RGB */ + +	sh_veu_reg_write(veu, VEU_SWPR, 0x67); +	sh_veu_reg_write(veu, VEU_TRCR, (6 << 16) | (0 << 14) | 2 | 4); + +	if (veu->is_2h) { +		sh_veu_reg_write(veu, VEU_MCR00, 0x0cc5); +		sh_veu_reg_write(veu, VEU_MCR01, 0x0950); +		sh_veu_reg_write(veu, VEU_MCR02, 0x0000); + +		sh_veu_reg_write(veu, VEU_MCR10, 0x397f); +		sh_veu_reg_write(veu, VEU_MCR11, 0x0950); +		sh_veu_reg_write(veu, VEU_MCR12, 0x3ccd); + +		sh_veu_reg_write(veu, VEU_MCR20, 0x0000); +		sh_veu_reg_write(veu, VEU_MCR21, 0x0950); +		sh_veu_reg_write(veu, VEU_MCR22, 0x1023); + +		sh_veu_reg_write(veu, VEU_COFFR, 0x00800010); +	} +} + +static int sh_veu_streamon(struct file *file, void *priv, +			   enum v4l2_buf_type type) +{ +	struct sh_veu_file *veu_file = priv; + +	if (!sh_veu_is_streamer(veu_file->veu_dev, veu_file, type)) +		return -EBUSY; + +	if (veu_file->cfg_needed) { +		struct sh_veu_dev *veu = veu_file->veu_dev; +		veu_file->cfg_needed = false; +		sh_veu_configure(veu_file->veu_dev); +		veu->xaction = 0; +		veu->aborting = false; +	} + +	return v4l2_m2m_streamon(file, veu_file->veu_dev->m2m_ctx, type); +} + +static int sh_veu_streamoff(struct file *file, void *priv, +			    enum v4l2_buf_type type) +{ +	struct sh_veu_file *veu_file = priv; + +	if (!sh_veu_is_streamer(veu_file->veu_dev, veu_file, type)) +		return -EBUSY; + +	return v4l2_m2m_streamoff(file, veu_file->veu_dev->m2m_ctx, type); +} + +static const struct v4l2_ioctl_ops sh_veu_ioctl_ops = { +	.vidioc_querycap	= sh_veu_querycap, + +	.vidioc_enum_fmt_vid_cap = sh_veu_enum_fmt_vid_cap, +	.vidioc_g_fmt_vid_cap	= sh_veu_g_fmt_vid_cap, +	.vidioc_try_fmt_vid_cap	= sh_veu_try_fmt_vid_cap, +	.vidioc_s_fmt_vid_cap	= sh_veu_s_fmt_vid_cap, + +	.vidioc_enum_fmt_vid_out = sh_veu_enum_fmt_vid_out, +	.vidioc_g_fmt_vid_out	= sh_veu_g_fmt_vid_out, +	.vidioc_try_fmt_vid_out	= sh_veu_try_fmt_vid_out, +	.vidioc_s_fmt_vid_out	= sh_veu_s_fmt_vid_out, + +	.vidioc_reqbufs		= sh_veu_reqbufs, +	.vidioc_querybuf	= sh_veu_querybuf, + +	.vidioc_qbuf		= sh_veu_qbuf, +	.vidioc_dqbuf		= sh_veu_dqbuf, + +	.vidioc_streamon	= sh_veu_streamon, +	.vidioc_streamoff	= sh_veu_streamoff, +}; + +		/* ========== Queue operations ========== */ + +static int sh_veu_queue_setup(struct vb2_queue *vq, +			      const struct v4l2_format *f, +			      unsigned int *nbuffers, unsigned int *nplanes, +			      unsigned int sizes[], void *alloc_ctxs[]) +{ +	struct sh_veu_dev *veu = vb2_get_drv_priv(vq); +	struct sh_veu_vfmt *vfmt; +	unsigned int size, count = *nbuffers; + +	if (f) { +		const struct v4l2_pix_format *pix = &f->fmt.pix; +		const struct sh_veu_format *fmt = sh_veu_find_fmt(f); +		struct v4l2_format ftmp = *f; + +		if (fmt->fourcc != pix->pixelformat) +			return -EINVAL; +		sh_veu_try_fmt(&ftmp, fmt); +		if (ftmp.fmt.pix.width != pix->width || +		    ftmp.fmt.pix.height != pix->height) +			return -EINVAL; +		size = pix->bytesperline ? pix->bytesperline * pix->height * fmt->depth / fmt->ydepth : +			pix->width * pix->height * fmt->depth / fmt->ydepth; +	} else { +		vfmt = sh_veu_get_vfmt(veu, vq->type); +		size = vfmt->bytesperline * vfmt->frame.height * vfmt->fmt->depth / vfmt->fmt->ydepth; +	} + +	if (count < 2) +		*nbuffers = count = 2; + +	if (size * count > VIDEO_MEM_LIMIT) { +		count = VIDEO_MEM_LIMIT / size; +		*nbuffers = count; +	} + +	*nplanes = 1; +	sizes[0] = size; +	alloc_ctxs[0] = veu->alloc_ctx; + +	dev_dbg(veu->dev, "get %d buffer(s) of size %d each.\n", count, size); + +	return 0; +} + +static int sh_veu_buf_prepare(struct vb2_buffer *vb) +{ +	struct sh_veu_dev *veu = vb2_get_drv_priv(vb->vb2_queue); +	struct sh_veu_vfmt *vfmt; +	unsigned int sizeimage; + +	vfmt = sh_veu_get_vfmt(veu, vb->vb2_queue->type); +	sizeimage = vfmt->bytesperline * vfmt->frame.height * +		vfmt->fmt->depth / vfmt->fmt->ydepth; + +	if (vb2_plane_size(vb, 0) < sizeimage) { +		dev_dbg(veu->dev, "%s data will not fit into plane (%lu < %u)\n", +			__func__, vb2_plane_size(vb, 0), sizeimage); +		return -EINVAL; +	} + +	vb2_set_plane_payload(vb, 0, sizeimage); + +	return 0; +} + +static void sh_veu_buf_queue(struct vb2_buffer *vb) +{ +	struct sh_veu_dev *veu = vb2_get_drv_priv(vb->vb2_queue); +	dev_dbg(veu->dev, "%s(%d)\n", __func__, vb->v4l2_buf.type); +	v4l2_m2m_buf_queue(veu->m2m_ctx, vb); +} + +static void sh_veu_wait_prepare(struct vb2_queue *q) +{ +	sh_veu_unlock(vb2_get_drv_priv(q)); +} + +static void sh_veu_wait_finish(struct vb2_queue *q) +{ +	sh_veu_lock(vb2_get_drv_priv(q)); +} + +static const struct vb2_ops sh_veu_qops = { +	.queue_setup	 = sh_veu_queue_setup, +	.buf_prepare	 = sh_veu_buf_prepare, +	.buf_queue	 = sh_veu_buf_queue, +	.wait_prepare	 = sh_veu_wait_prepare, +	.wait_finish	 = sh_veu_wait_finish, +}; + +static int sh_veu_queue_init(void *priv, struct vb2_queue *src_vq, +			     struct vb2_queue *dst_vq) +{ +	int ret; + +	memset(src_vq, 0, sizeof(*src_vq)); +	src_vq->type = V4L2_BUF_TYPE_VIDEO_OUTPUT; +	src_vq->io_modes = VB2_MMAP | VB2_USERPTR; +	src_vq->drv_priv = priv; +	src_vq->buf_struct_size = sizeof(struct v4l2_m2m_buffer); +	src_vq->ops = &sh_veu_qops; +	src_vq->mem_ops = &vb2_dma_contig_memops; + +	ret = vb2_queue_init(src_vq); +	if (ret < 0) +		return ret; + +	memset(dst_vq, 0, sizeof(*dst_vq)); +	dst_vq->type = V4L2_BUF_TYPE_VIDEO_CAPTURE; +	dst_vq->io_modes = VB2_MMAP | VB2_USERPTR; +	dst_vq->drv_priv = priv; +	dst_vq->buf_struct_size = sizeof(struct v4l2_m2m_buffer); +	dst_vq->ops = &sh_veu_qops; +	dst_vq->mem_ops = &vb2_dma_contig_memops; + +	return vb2_queue_init(dst_vq); +} + +		/* ========== File operations ========== */ + +static int sh_veu_open(struct file *file) +{ +	struct sh_veu_dev *veu = video_drvdata(file); +	struct sh_veu_file *veu_file; + +	veu_file = kzalloc(sizeof(*veu_file), GFP_KERNEL); +	if (!veu_file) +		return -ENOMEM; + +	veu_file->veu_dev = veu; +	veu_file->cfg_needed = true; + +	file->private_data = veu_file; + +	pm_runtime_get_sync(veu->dev); + +	dev_dbg(veu->dev, "Created instance %p\n", veu_file); + +	return 0; +} + +static int sh_veu_release(struct file *file) +{ +	struct sh_veu_dev *veu = video_drvdata(file); +	struct sh_veu_file *veu_file = file->private_data; + +	dev_dbg(veu->dev, "Releasing instance %p\n", veu_file); + +	if (veu_file == veu->capture) { +		veu->capture = NULL; +		vb2_queue_release(v4l2_m2m_get_vq(veu->m2m_ctx, V4L2_BUF_TYPE_VIDEO_CAPTURE)); +	} + +	if (veu_file == veu->output) { +		veu->output = NULL; +		vb2_queue_release(v4l2_m2m_get_vq(veu->m2m_ctx, V4L2_BUF_TYPE_VIDEO_OUTPUT)); +	} + +	if (!veu->output && !veu->capture && veu->m2m_ctx) { +		v4l2_m2m_ctx_release(veu->m2m_ctx); +		veu->m2m_ctx = NULL; +	} + +	pm_runtime_put(veu->dev); + +	kfree(veu_file); + +	return 0; +} + +static unsigned int sh_veu_poll(struct file *file, +				struct poll_table_struct *wait) +{ +	struct sh_veu_file *veu_file = file->private_data; + +	return v4l2_m2m_poll(file, veu_file->veu_dev->m2m_ctx, wait); +} + +static int sh_veu_mmap(struct file *file, struct vm_area_struct *vma) +{ +	struct sh_veu_file *veu_file = file->private_data; + +	return v4l2_m2m_mmap(file, veu_file->veu_dev->m2m_ctx, vma); +} + +static const struct v4l2_file_operations sh_veu_fops = { +	.owner		= THIS_MODULE, +	.open		= sh_veu_open, +	.release	= sh_veu_release, +	.poll		= sh_veu_poll, +	.unlocked_ioctl	= video_ioctl2, +	.mmap		= sh_veu_mmap, +}; + +static const struct video_device sh_veu_videodev = { +	.name		= "sh-veu", +	.fops		= &sh_veu_fops, +	.ioctl_ops	= &sh_veu_ioctl_ops, +	.minor		= -1, +	.release	= video_device_release_empty, +	.vfl_dir	= VFL_DIR_M2M, +}; + +static const struct v4l2_m2m_ops sh_veu_m2m_ops = { +	.device_run	= sh_veu_device_run, +	.job_abort	= sh_veu_job_abort, +}; + +static irqreturn_t sh_veu_bh(int irq, void *dev_id) +{ +	struct sh_veu_dev *veu = dev_id; + +	if (veu->xaction == MEM2MEM_DEF_TRANSLEN || veu->aborting) { +		v4l2_m2m_job_finish(veu->m2m_dev, veu->m2m_ctx); +		veu->xaction = 0; +	} else { +		sh_veu_device_run(veu); +	} + +	return IRQ_HANDLED; +} + +static irqreturn_t sh_veu_isr(int irq, void *dev_id) +{ +	struct sh_veu_dev *veu = dev_id; +	struct vb2_buffer *dst; +	struct vb2_buffer *src; +	u32 status = sh_veu_reg_read(veu, VEU_EVTR); + +	/* bundle read mode not used */ +	if (!(status & 1)) +		return IRQ_NONE; + +	/* disable interrupt in VEU */ +	sh_veu_reg_write(veu, VEU_EIER, 0); +	/* halt operation */ +	sh_veu_reg_write(veu, VEU_STR, 0); +	/* ack int, write 0 to clear bits */ +	sh_veu_reg_write(veu, VEU_EVTR, status & ~1); + +	/* conversion completed */ +	dst = v4l2_m2m_dst_buf_remove(veu->m2m_ctx); +	src = v4l2_m2m_src_buf_remove(veu->m2m_ctx); +	if (!src || !dst) +		return IRQ_NONE; + +	spin_lock(&veu->lock); +	v4l2_m2m_buf_done(src, VB2_BUF_STATE_DONE); +	v4l2_m2m_buf_done(dst, VB2_BUF_STATE_DONE); +	spin_unlock(&veu->lock); + +	veu->xaction++; + +	return IRQ_WAKE_THREAD; +} + +static int sh_veu_probe(struct platform_device *pdev) +{ +	struct sh_veu_dev *veu; +	struct resource *reg_res; +	struct video_device *vdev; +	int irq, ret; + +	reg_res = platform_get_resource(pdev, IORESOURCE_MEM, 0); +	irq = platform_get_irq(pdev, 0); + +	if (!reg_res || irq <= 0) { +		dev_err(&pdev->dev, "Insufficient VEU platform information.\n"); +		return -ENODEV; +	} + +	veu = devm_kzalloc(&pdev->dev, sizeof(*veu), GFP_KERNEL); +	if (!veu) +		return -ENOMEM; + +	veu->is_2h = resource_size(reg_res) == 0x22c; + +	veu->base = devm_ioremap_resource(&pdev->dev, reg_res); +	if (IS_ERR(veu->base)) +		return PTR_ERR(veu->base); + +	ret = devm_request_threaded_irq(&pdev->dev, irq, sh_veu_isr, sh_veu_bh, +					0, "veu", veu); +	if (ret < 0) +		return ret; + +	ret = v4l2_device_register(&pdev->dev, &veu->v4l2_dev); +	if (ret < 0) { +		dev_err(&pdev->dev, "Error registering v4l2 device\n"); +		return ret; +	} + +	vdev = &veu->vdev; + +	veu->alloc_ctx = vb2_dma_contig_init_ctx(&pdev->dev); +	if (IS_ERR(veu->alloc_ctx)) { +		ret = PTR_ERR(veu->alloc_ctx); +		goto einitctx; +	} + +	*vdev = sh_veu_videodev; +	spin_lock_init(&veu->lock); +	mutex_init(&veu->fop_lock); +	vdev->lock = &veu->fop_lock; + +	video_set_drvdata(vdev, veu); + +	veu->dev	= &pdev->dev; +	veu->vfmt_out	= DEFAULT_OUT_VFMT; +	veu->vfmt_in	= DEFAULT_IN_VFMT; + +	veu->m2m_dev = v4l2_m2m_init(&sh_veu_m2m_ops); +	if (IS_ERR(veu->m2m_dev)) { +		ret = PTR_ERR(veu->m2m_dev); +		v4l2_err(&veu->v4l2_dev, "Failed to init mem2mem device: %d\n", ret); +		goto em2minit; +	} + +	pm_runtime_enable(&pdev->dev); +	pm_runtime_resume(&pdev->dev); + +	ret = video_register_device(vdev, VFL_TYPE_GRABBER, -1); +	pm_runtime_suspend(&pdev->dev); +	if (ret < 0) +		goto evidreg; + +	return ret; + +evidreg: +	pm_runtime_disable(&pdev->dev); +	v4l2_m2m_release(veu->m2m_dev); +em2minit: +	vb2_dma_contig_cleanup_ctx(veu->alloc_ctx); +einitctx: +	v4l2_device_unregister(&veu->v4l2_dev); +	return ret; +} + +static int sh_veu_remove(struct platform_device *pdev) +{ +	struct v4l2_device *v4l2_dev = platform_get_drvdata(pdev); +	struct sh_veu_dev *veu = container_of(v4l2_dev, +					      struct sh_veu_dev, v4l2_dev); + +	video_unregister_device(&veu->vdev); +	pm_runtime_disable(&pdev->dev); +	v4l2_m2m_release(veu->m2m_dev); +	vb2_dma_contig_cleanup_ctx(veu->alloc_ctx); +	v4l2_device_unregister(&veu->v4l2_dev); + +	return 0; +} + +static struct platform_driver __refdata sh_veu_pdrv = { +	.remove		= sh_veu_remove, +	.driver		= { +		.name	= "sh_veu", +		.owner	= THIS_MODULE, +	}, +}; + +module_platform_driver_probe(sh_veu_pdrv, sh_veu_probe); + +MODULE_DESCRIPTION("sh-mobile VEU mem2mem driver"); +MODULE_AUTHOR("Guennadi Liakhovetski, <g.liakhovetski@gmx.de>"); +MODULE_LICENSE("GPL v2");  | 
