X-Git-Url: https://git.carlh.net/gitweb/?a=blobdiff_plain;f=src%2Flib%2Fimage.cc;h=dbea62d26b3b7363d7c33ce7df19dff170430a5f;hb=7b96999f95cd715ad49b1715602287fa4cae0950;hp=05270954dd6309271efacf30bd00f8f6d4849f5f;hpb=5161626c3c28ba528511a8b211286a5e81a0f02a;p=dcpomatic.git

diff --git a/src/lib/image.cc b/src/lib/image.cc
index 05270954d..dbea62d26 100644
--- a/src/lib/image.cc
+++ b/src/lib/image.cc
@@ -18,30 +18,40 @@
 */
 
 /** @file src/image.cc
- *  @brief A set of classes to describe video images.
+ *  @brief A class to describe a video image.
  */
 
-#include <sstream>
-#include <iomanip>
 #include <iostream>
-#include <sys/time.h>
-#include <boost/algorithm/string.hpp>
-#include <boost/bind.hpp>
-#include <openjpeg.h>
 extern "C" {
-#include <libavcodec/avcodec.h>
-#include <libavformat/avformat.h>
 #include <libswscale/swscale.h>
-#include <libavfilter/avfiltergraph.h>
-#include <libpostproc/postprocess.h>
 #include <libavutil/pixfmt.h>
+#include <libavutil/pixdesc.h>
+#include <libpostproc/postprocess.h>
 }
 #include "image.h"
 #include "exceptions.h"
 #include "scaler.h"
 
-using namespace std;
-using namespace boost;
+using std::string;
+using std::min;
+using std::cout;
+using boost::shared_ptr;
+using libdcp::Size;
+
+int
+Image::line_factor (int n) const
+{
+	if (n == 0) {
+		return 1;
+	}
+
+	AVPixFmtDescriptor const * d = av_pix_fmt_desc_get(_pixel_format);
+	if (!d) {
+		throw PixelFormatError ("lines()", _pixel_format);
+	}
+	
+	return pow (2.0f, d->log2_chroma_h);
+}
 
 /** @param n Component index.
  *  @return Number of lines in the image for the given component.
@@ -49,55 +59,39 @@ using namespace boost;
 int
 Image::lines (int n) const
 {
-	switch (_pixel_format) {
-	case PIX_FMT_YUV420P:
-		if (n == 0) {
-			return size().height;
-		} else {
-			return size().height / 2;
-		}
-		break;
-	case PIX_FMT_RGB24:
-	case PIX_FMT_RGBA:
-	case PIX_FMT_YUV422P10LE:
-	case PIX_FMT_YUV422P:
-		return size().height;
-	default:
-		assert (false);
-	}
-
-	return 0;
+	return rint (ceil (static_cast<double>(size().height) / line_factor (n)));
 }
 
 /** @return Number of components */
 int
 Image::components () const
 {
-	switch (_pixel_format) {
-	case PIX_FMT_YUV420P:
-	case PIX_FMT_YUV422P10LE:
-	case PIX_FMT_YUV422P:
-		return 3;
-	case PIX_FMT_RGB24:
-	case PIX_FMT_RGBA:
-		return 1;
-	default:
-		assert (false);
+	AVPixFmtDescriptor const * d = av_pix_fmt_desc_get(_pixel_format);
+	if (!d) {
+		throw PixelFormatError ("components()", _pixel_format);
 	}
 
-	return 0;
+	if ((d->flags & PIX_FMT_PLANAR) == 0) {
+		return 1;
+	}
+	
+	return d->nb_components;
 }
 
 shared_ptr<Image>
-Image::scale (Size out_size, Scaler const * scaler) const
+Image::scale (libdcp::Size out_size, Scaler const * scaler, AVPixelFormat result_format, bool result_aligned) const
 {
 	assert (scaler);
+	/* Empirical testing suggests that sws_scale() will crash if
+	   the input image is not aligned.
+	*/
+	assert (aligned ());
 
-	shared_ptr<Image> scaled (new AlignedImage (pixel_format(), out_size));
+	shared_ptr<Image> scaled (new Image (result_format, out_size, result_aligned));
 
 	struct SwsContext* scale_context = sws_getContext (
 		size().width, size().height, pixel_format(),
-		out_size.width, out_size.height, pixel_format(),
+		out_size.width, out_size.height, result_format,
 		scaler->ffmpeg_id (), 0, 0, 0
 		);
 
@@ -113,69 +107,14 @@ Image::scale (Size out_size, Scaler const * scaler) const
 	return scaled;
 }
 
-/** Scale this image to a given size and convert it to RGB.
- *  @param out_size Output image size in pixels.
- *  @param scaler Scaler to use.
- */
-shared_ptr<Image>
-Image::scale_and_convert_to_rgb (Size out_size, int padding, Scaler const * scaler) const
-{
-	assert (scaler);
-
-	Size content_size = out_size;
-	content_size.width -= (padding * 2);
-
-	shared_ptr<Image> rgb (new AlignedImage (PIX_FMT_RGB24, content_size));
-
-	struct SwsContext* scale_context = sws_getContext (
-		size().width, size().height, pixel_format(),
-		content_size.width, content_size.height, PIX_FMT_RGB24,
-		scaler->ffmpeg_id (), 0, 0, 0
-		);
-
-	/* Scale and convert to RGB from whatever its currently in (which may be RGB) */
-	sws_scale (
-		scale_context,
-		data(), stride(),
-		0, size().height,
-		rgb->data(), rgb->stride()
-		);
-
-	/* Put the image in the right place in a black frame if are padding; this is
-	   a bit grubby and expensive, but probably inconsequential in the great
-	   scheme of things.
-	*/
-	if (padding > 0) {
-		shared_ptr<Image> padded_rgb (new AlignedImage (PIX_FMT_RGB24, out_size));
-		padded_rgb->make_black ();
-
-		/* XXX: we are cheating a bit here; we know the frame is RGB so we can
-		   make assumptions about its composition.
-		*/
-		uint8_t* p = padded_rgb->data()[0] + padding * 3;
-		uint8_t* q = rgb->data()[0];
-		for (int j = 0; j < rgb->lines(0); ++j) {
-			memcpy (p, q, rgb->line_size()[0]);
-			p += padded_rgb->stride()[0];
-			q += rgb->stride()[0];
-		}
-
-		rgb = padded_rgb;
-	}
-
-	sws_freeContext (scale_context);
-
-	return rgb;
-}
-
 /** Run a FFmpeg post-process on this image and return the processed version.
  *  @param pp Flags for the required set of post processes.
  *  @return Post-processed image.
  */
 shared_ptr<Image>
-Image::post_process (string pp) const
+Image::post_process (string pp, bool aligned) const
 {
-	shared_ptr<Image> out (new AlignedImage (pixel_format(), size ()));
+	shared_ptr<Image> out (new Image (pixel_format(), size (), aligned));
 
 	int pp_format = 0;
 	switch (pixel_format()) {
@@ -184,10 +123,17 @@ Image::post_process (string pp) const
 		break;
 	case PIX_FMT_YUV422P10LE:
 	case PIX_FMT_YUV422P:
+	case PIX_FMT_UYVY422:
 		pp_format = PP_FORMAT_422;
 		break;
+	case PIX_FMT_YUV444P:
+	case PIX_FMT_YUV444P9BE:
+	case PIX_FMT_YUV444P9LE:
+	case PIX_FMT_YUV444P10BE:
+	case PIX_FMT_YUV444P10LE:
+		pp_format = PP_FORMAT_444;
 	default:
-		assert (false);
+		throw PixelFormatError ("post_process", pixel_format());
 	}
 		
 	pp_mode* mode = pp_get_mode_by_name_and_quality (pp.c_str (), PP_QUALITY_MAX);
@@ -206,29 +152,140 @@ Image::post_process (string pp) const
 	return out;
 }
 
+shared_ptr<Image>
+Image::crop (Crop crop, bool aligned) const
+{
+	libdcp::Size cropped_size = size ();
+	cropped_size.width -= crop.left + crop.right;
+	cropped_size.height -= crop.top + crop.bottom;
+
+	shared_ptr<Image> out (new Image (pixel_format(), cropped_size, aligned));
+
+	for (int c = 0; c < components(); ++c) {
+		int const crop_left_in_bytes = bytes_per_pixel(c) * crop.left;
+		/* bytes_per_pixel() could be a fraction; in this case the stride will be rounded
+		   up, and we need to make sure that we copy over the width (up to the stride)
+		   rather than short of the width; hence the ceil() here.
+		*/
+		int const cropped_width_in_bytes = ceil (bytes_per_pixel(c) * cropped_size.width);
+
+		/* Start of the source line, cropped from the top but not the left */
+		uint8_t* in_p = data()[c] + (crop.top / out->line_factor(c)) * stride()[c];
+		uint8_t* out_p = out->data()[c];
+
+		for (int y = 0; y < out->lines(c); ++y) {
+			memcpy (out_p, in_p + crop_left_in_bytes, cropped_width_in_bytes);
+			in_p += stride()[c];
+			out_p += out->stride()[c];
+		}
+	}
+
+	return out;
+}
+
+/** Blacken a YUV image whose bits per pixel is rounded up to 16 */
+void
+Image::yuv_16_black (uint16_t v)
+{
+	memset (data()[0], 0, lines(0) * stride()[0]);
+	for (int i = 1; i < 3; ++i) {
+		int16_t* p = reinterpret_cast<int16_t*> (data()[i]);
+		for (int y = 0; y < size().height; ++y) {
+			for (int x = 0; x < line_size()[i] / 2; ++x) {
+				p[x] = v;
+			}
+			p += stride()[i] / 2;
+		}
+	}
+}
+
+uint16_t
+Image::swap_16 (uint16_t v)
+{
+	return ((v >> 8) & 0xff) | ((v & 0xff) << 8);
+}
+
 void
 Image::make_black ()
 {
+	/* U/V black value for 8-bit colour */
+	static uint8_t const eight_bit_uv =	(1 << 7) - 1;
+	/* U/V black value for 9-bit colour */
+	static uint16_t const nine_bit_uv =	(1 << 8) - 1;
+	/* U/V black value for 10-bit colour */
+	static uint16_t const ten_bit_uv =	(1 << 9) - 1;
+	/* U/V black value for 16-bit colour */
+	static uint16_t const sixteen_bit_uv =	(1 << 15) - 1;
+	
 	switch (_pixel_format) {
 	case PIX_FMT_YUV420P:
-	case PIX_FMT_YUV422P10LE:
 	case PIX_FMT_YUV422P:
+	case PIX_FMT_YUV444P:
 		memset (data()[0], 0, lines(0) * stride()[0]);
-		memset (data()[1], 0x80, lines(1) * stride()[1]);
-		memset (data()[2], 0x80, lines(2) * stride()[2]);
+		memset (data()[1], eight_bit_uv, lines(1) * stride()[1]);
+		memset (data()[2], eight_bit_uv, lines(2) * stride()[2]);
+		break;
+
+	case PIX_FMT_YUVJ420P:
+	case PIX_FMT_YUVJ422P:
+	case PIX_FMT_YUVJ444P:
+		memset (data()[0], 0, lines(0) * stride()[0]);
+		memset (data()[1], eight_bit_uv + 1, lines(1) * stride()[1]);
+		memset (data()[2], eight_bit_uv + 1, lines(2) * stride()[2]);
+		break;
+
+	case PIX_FMT_YUV422P9LE:
+	case PIX_FMT_YUV444P9LE:
+		yuv_16_black (nine_bit_uv);
+		break;
+
+	case PIX_FMT_YUV422P9BE:
+	case PIX_FMT_YUV444P9BE:
+		yuv_16_black (swap_16 (nine_bit_uv));
+		break;
+		
+	case PIX_FMT_YUV422P10LE:
+	case PIX_FMT_YUV444P10LE:
+		yuv_16_black (ten_bit_uv);
+		break;
+
+	case PIX_FMT_YUV422P16LE:
+	case PIX_FMT_YUV444P16LE:
+		yuv_16_black (sixteen_bit_uv);
+		break;
+		
+	case PIX_FMT_YUV444P10BE:
+	case PIX_FMT_YUV422P10BE:
+		yuv_16_black (swap_16 (ten_bit_uv));
 		break;
 
 	case PIX_FMT_RGB24:		
 		memset (data()[0], 0, lines(0) * stride()[0]);
 		break;
 
+	case PIX_FMT_UYVY422:
+	{
+		int const Y = lines(0);
+		int const X = line_size()[0];
+		uint8_t* p = data()[0];
+		for (int y = 0; y < Y; ++y) {
+			for (int x = 0; x < X / 4; ++x) {
+				*p++ = eight_bit_uv; // Cb
+				*p++ = 0;	     // Y0
+				*p++ = eight_bit_uv; // Cr
+				*p++ = 0;	     // Y1
+			}
+		}
+		break;
+	}
+
 	default:
-		assert (false);
+		throw PixelFormatError ("make_black()", _pixel_format);
 	}
 }
 
 void
-Image::alpha_blend (shared_ptr<Image> other, Position position)
+Image::alpha_blend (shared_ptr<const Image> other, Position<int> position)
 {
 	/* Only implemented for RGBA onto RGB24 so far */
 	assert (_pixel_format == PIX_FMT_RGB24 && other->pixel_format() == PIX_FMT_RGBA);
@@ -263,13 +320,28 @@ Image::alpha_blend (shared_ptr<Image> other, Position position)
 	}
 }
 
+void
+Image::copy (shared_ptr<const Image> other, Position<int> position)
+{
+	/* Only implemented for RGB24 onto RGB24 so far */
+	assert (_pixel_format == PIX_FMT_RGB24 && other->pixel_format() == PIX_FMT_RGB24);
+	assert (position.x >= 0 && position.y >= 0);
+
+	int const N = min (position.x + other->size().width, size().width) - position.x;
+	for (int ty = position.y, oy = 0; ty < size().height && oy < other->size().height; ++ty, ++oy) {
+		uint8_t * const tp = data()[0] + ty * stride()[0] + position.x * 3;
+		uint8_t * const op = other->data()[0] + oy * other->stride()[0];
+		memcpy (tp, op, N * 3);
+	}
+}	
+
 void
 Image::read_from_socket (shared_ptr<Socket> socket)
 {
 	for (int i = 0; i < components(); ++i) {
 		uint8_t* p = data()[i];
 		for (int y = 0; y < lines(i); ++y) {
-			socket->read_definite_and_consume (p, line_size()[i], 30);
+			socket->read (p, line_size()[i]);
 			p += stride()[i];
 		}
 	}
@@ -281,21 +353,62 @@ Image::write_to_socket (shared_ptr<Socket> socket) const
 	for (int i = 0; i < components(); ++i) {
 		uint8_t* p = data()[i];
 		for (int y = 0; y < lines(i); ++y) {
-			socket->write (p, line_size()[i], 30);
+			socket->write (p, line_size()[i]);
 			p += stride()[i];
 		}
 	}
 }
 
-/** Construct a SimpleImage of a given size and format, allocating memory
+
+float
+Image::bytes_per_pixel (int c) const
+{
+	AVPixFmtDescriptor const * d = av_pix_fmt_desc_get(_pixel_format);
+	if (!d) {
+		throw PixelFormatError ("lines()", _pixel_format);
+	}
+
+	if (c >= components()) {
+		return 0;
+	}
+
+	float bpp[4] = { 0, 0, 0, 0 };
+
+	bpp[0] = floor ((d->comp[0].depth_minus1 + 1 + 7) / 8);
+	if (d->nb_components > 1) {
+		bpp[1] = floor ((d->comp[1].depth_minus1 + 1 + 7) / 8) / pow (2.0f, d->log2_chroma_w);
+	}
+	if (d->nb_components > 2) {
+		bpp[2] = floor ((d->comp[2].depth_minus1 + 1 + 7) / 8) / pow (2.0f, d->log2_chroma_w);
+	}
+	if (d->nb_components > 3) {
+		bpp[3] = floor ((d->comp[3].depth_minus1 + 1 + 7) / 8) / pow (2.0f, d->log2_chroma_w);
+	}
+	
+	if ((d->flags & PIX_FMT_PLANAR) == 0) {
+		/* Not planar; sum them up */
+		return bpp[0] + bpp[1] + bpp[2] + bpp[3];
+	}
+
+	return bpp[c];
+}
+
+/** Construct an Image of a given size and format, allocating memory
  *  as required.
  *
  *  @param p Pixel format.
  *  @param s Size in pixels.
  */
-SimpleImage::SimpleImage (AVPixelFormat p, Size s, function<int (int)> rounder)
-	: Image (p)
-	, _size (s)
+Image::Image (AVPixelFormat p, libdcp::Size s, bool aligned)
+	: libdcp::Image (s)
+	, _pixel_format (p)
+	, _aligned (aligned)
+{
+	allocate ();
+}
+
+void
+Image::allocate ()
 {
 	_data = (uint8_t **) av_malloc (4 * sizeof (uint8_t *));
 	_data[0] = _data[1] = _data[2] = _data[3] = 0;
@@ -306,147 +419,146 @@ SimpleImage::SimpleImage (AVPixelFormat p, Size s, function<int (int)> rounder)
 	_stride = (int *) av_malloc (4 * sizeof (int));
 	_stride[0] = _stride[1] = _stride[2] = _stride[3] = 0;
 
-	switch (p) {
-	case PIX_FMT_RGB24:
-		_line_size[0] = s.width * 3;
-		break;
-	case PIX_FMT_RGBA:
-		_line_size[0] = s.width * 4;
-		break;
-	case PIX_FMT_YUV420P:
-	case PIX_FMT_YUV422P:
-		_line_size[0] = s.width;
-		_line_size[1] = s.width / 2;
-		_line_size[2] = s.width / 2;
-		break;
-	case PIX_FMT_YUV422P10LE:
-		_line_size[0] = s.width * 2;
-		_line_size[1] = s.width;
-		_line_size[2] = s.width;
-		break;
-	default:
-		assert (false);
-	}
-
 	for (int i = 0; i < components(); ++i) {
-		_stride[i] = rounder (_line_size[i]);
-		_data[i] = (uint8_t *) av_malloc (_stride[i] * lines (i));
+		_line_size[i] = ceil (_size.width * bytes_per_pixel(i));
+		_stride[i] = stride_round_up (i, _line_size, _aligned ? 32 : 1);
+
+		/* The assembler function ff_rgb24ToY_avx (in libswscale/x86/input.asm)
+		   uses a 16-byte fetch to read three bytes (R/G/B) of image data.
+		   Hence on the last pixel of the last line it reads over the end of
+		   the actual data by 1 byte.  If the width of an image is a multiple
+		   of the stride alignment there will be no padding at the end of image lines.
+		   OS X crashes on this illegal read, though other operating systems don't
+		   seem to mind.  The nasty + 1 in this malloc makes sure there is always a byte
+		   for that instruction to read safely.
+		*/
+		_data[i] = (uint8_t *) av_malloc (_stride[i] * lines (i) + 1);
 	}
 }
 
-/** Destroy a SimpleImage */
-SimpleImage::~SimpleImage ()
+Image::Image (Image const & other)
+	: libdcp::Image (other)
+	,  _pixel_format (other._pixel_format)
+	, _aligned (other._aligned)
 {
+	allocate ();
+
 	for (int i = 0; i < components(); ++i) {
-		av_free (_data[i]);
+		uint8_t* p = _data[i];
+		uint8_t* q = other._data[i];
+		for (int j = 0; j < lines(i); ++j) {
+			memcpy (p, q, _line_size[i]);
+			p += stride()[i];
+			q += other.stride()[i];
+		}
 	}
-
-	av_free (_data);
-	av_free (_line_size);
-	av_free (_stride);
 }
 
-uint8_t **
-SimpleImage::data () const
+Image::Image (AVFrame* frame)
+	: libdcp::Image (libdcp::Size (frame->width, frame->height))
+	, _pixel_format (static_cast<AVPixelFormat> (frame->format))
+	, _aligned (true)
 {
-	return _data;
-}
+	allocate ();
 
-int *
-SimpleImage::line_size () const
-{
-	return _line_size;
+	for (int i = 0; i < components(); ++i) {
+		uint8_t* p = _data[i];
+		uint8_t* q = frame->data[i];
+		for (int j = 0; j < lines(i); ++j) {
+			memcpy (p, q, _line_size[i]);
+			p += stride()[i];
+			/* AVFrame's linesize is what we call `stride' */
+			q += frame->linesize[i];
+		}
+	}
 }
 
-int *
-SimpleImage::stride () const
+Image::Image (shared_ptr<const Image> other, bool aligned)
+	: libdcp::Image (other)
+	, _pixel_format (other->_pixel_format)
+	, _aligned (aligned)
 {
-	return _stride;
-}
+	allocate ();
 
-Size
-SimpleImage::size () const
-{
-	return _size;
+	for (int i = 0; i < components(); ++i) {
+		assert(line_size()[i] == other->line_size()[i]);
+		uint8_t* p = _data[i];
+		uint8_t* q = other->data()[i];
+		for (int j = 0; j < lines(i); ++j) {
+			memcpy (p, q, line_size()[i]);
+			p += stride()[i];
+			q += other->stride()[i];
+		}
+	}
 }
 
-AlignedImage::AlignedImage (AVPixelFormat f, Size s)
-	: SimpleImage (f, s, boost::bind (round_up, _1, 32))
+Image&
+Image::operator= (Image const & other)
 {
+	if (this == &other) {
+		return *this;
+	}
 
+	Image tmp (other);
+	swap (tmp);
+	return *this;
 }
 
-CompactImage::CompactImage (AVPixelFormat f, Size s)
-	: SimpleImage (f, s, boost::bind (round_up, _1, 1))
-{
-	setup_picture ();
-}
-
-CompactImage::CompactImage (shared_ptr<Image> im)
-	: SimpleImage (im->pixel_format(), im->size(), boost::bind (round_up, _1, 1))
+void
+Image::swap (Image & other)
 {
-	assert (components() == im->components());
-
-	for (int c = 0; c < components(); ++c) {
-
-		assert (line_size()[c] == im->line_size()[c]);
+	libdcp::Image::swap (other);
+	
+	std::swap (_pixel_format, other._pixel_format);
 
-		uint8_t* t = data()[c];
-		uint8_t* o = im->data()[c];
-		
-		for (int y = 0; y < lines(c); ++y) {
-			memcpy (t, o, line_size()[c]);
-			t += stride()[c];
-			o += im->stride()[c];
-		}
+	for (int i = 0; i < 4; ++i) {
+		std::swap (_data[i], other._data[i]);
+		std::swap (_line_size[i], other._line_size[i]);
+		std::swap (_stride[i], other._stride[i]);
 	}
 
-	setup_picture ();
+	std::swap (_aligned, other._aligned);
 }
 
-void
-CompactImage::setup_picture ()
+/** Destroy an Image */
+Image::~Image ()
 {
-	for (int c = 0; c < components(); ++c) {
-		_picture.data[c] = data()[c];
-		_picture.linesize[c] = line_size()[c];
+	for (int i = 0; i < components(); ++i) {
+		av_free (_data[i]);
 	}
-}
-
-FilterBufferImage::FilterBufferImage (AVPixelFormat p, AVFilterBufferRef* b)
-	: Image (p)
-	, _buffer (b)
-{
 
+	av_free (_data);
+	av_free (_line_size);
+	av_free (_stride);
 }
 
-FilterBufferImage::~FilterBufferImage ()
+uint8_t **
+Image::data () const
 {
-	avfilter_unref_buffer (_buffer);
+	return _data;
 }
 
-uint8_t **
-FilterBufferImage::data () const
+int *
+Image::line_size () const
 {
-	return _buffer->data;
+	return _line_size;
 }
 
 int *
-FilterBufferImage::line_size () const
+Image::stride () const
 {
-	return _buffer->linesize;
+	return _stride;
 }
 
-int *
-FilterBufferImage::stride () const
+libdcp::Size
+Image::size () const
 {
-	/* XXX? */
-	return _buffer->linesize;
+	return _size;
 }
 
-Size
-FilterBufferImage::size () const
+bool
+Image::aligned () const
 {
-	return Size (_buffer->video->w, _buffer->video->h);
+	return _aligned;
 }