Entirely untested resampling to fix 24fps drop-frame.

author: Carl Hetherington <cth@carlh.net> 2012-09-29 23:41:25 +0100
committer: Carl Hetherington <cth@carlh.net> 2012-09-29 23:41:25 +0100
commit: f3fdae3f8f4ae54b17f925f81a5e9d4b3589269b (patch)
tree: dc80a1c814b67e15b7bba8902b3a331ce9ea2d80 /src/lib/j2k_wav_encoder.cc
parent: 1774f34b5420c0526991f3f1b621d9ca53eaf345 (diff)
1 files changed, 132 insertions, 5 deletions
diff --git a/src/lib/j2k_wav_encoder.cc b/src/lib/j2k_wav_encoder.cc
index 9ae01c774..86c3ae13f 100644
--- a/src/lib/j2k_wav_encoder.cc
+++ b/src/lib/j2k_wav_encoder.cc
@@ -46,6 +46,9 @@ using namespace boost;
 
 J2KWAVEncoder::J2KWAVEncoder (shared_ptr<const FilmState> s, shared_ptr<const Options> o, Log* l)
 	: Encoder (s, o, l)
+#ifdef HAVE_SWRESAMPLE	  
+	, _swr_context (0)
+#endif	  
 	, _deinterleave_buffer_size (8192)
 	, _deinterleave_buffer (0)
 	, _process_end (false)
@@ -210,8 +213,31 @@ J2KWAVEncoder::encoder_thread (ServerDescription* server)
 }
 
 void
-J2KWAVEncoder::process_begin ()
+J2KWAVEncoder::process_begin (int64_t audio_channel_layout, AVSampleFormat audio_sample_format)
 {
+	if ((_fs->audio_sample_rate != dcp_audio_sample_rate (_fs->audio_sample_rate)) || (rint (_fs->frames_per_second) != _fs->frames_per_second)) {
+#ifdef HAVE_SWRESAMPLE		
+		_swr_context = swr_alloc_set_opts (
+			0,
+			audio_channel_layout,
+			audio_sample_format,
+			target_sample_rate(),
+			audio_channel_layout,
+			audio_sample_format,
+			_fs->audio_sample_rate,
+			0, 0
+			);
+		
+		swr_init (_swr_context);
+#else
+		throw EncodeError ("Cannot resample audio as libswresample is not present");
+#endif
+	} else {
+#ifdef HAVE_SWRESAMPLE
+		_swr_context = 0;
+#endif		
+	}
+	
 	for (int i = 0; i < Config::instance()->num_local_encoding_threads (); ++i) {
 		_worker_threads.push_back (new boost::thread (boost::bind (&J2KWAVEncoder::encoder_thread, this, (ServerDescription *) 0)));
 	}
@@ -268,6 +294,34 @@ J2KWAVEncoder::process_end ()
 			_log->log (s.str ());
 		}
 	}
+
+#if HAVE_SWRESAMPLE	
+	if (_swr_context) {
+
+		int mop = 0;
+		while (1) {
+			uint8_t buffer[256 * _fs->bytes_per_sample() * _fs->audio_channels];
+			uint8_t* out[1] = {
+				buffer
+			};
+
+			int const frames = swr_convert (_swr_context, out, 256, 0, 0);
+
+			if (frames < 0) {
+				throw EncodeError ("could not run sample-rate converter");
+			}
+
+			if (frames == 0) {
+				break;
+			}
+
+			mop += frames;
+			write_audio (buffer, frames);
+		}
+
+		swr_free (&_swr_context);
+	}
+#endif	
 	
 	close_sound_files ();
 
@@ -281,11 +335,64 @@ J2KWAVEncoder::process_end ()
 }
 
 void
-J2KWAVEncoder::process_audio (uint8_t* data, int data_size)
+J2KWAVEncoder::process_audio (uint8_t* data, int size)
+{
+	/* This is a buffer we might use if we are sample-rate converting;
+	   it will need freeing if so.
+	*/
+	uint8_t* out_buffer = 0;
+	
+	/* Maybe sample-rate convert */
+#if HAVE_SWRESAMPLE	
+	if (_swr_context) {
+
+		uint8_t const * in[2] = {
+			data,
+			0
+		};
+
+		/* Here's samples per channel */
+		int const samples = size / _fs->bytes_per_sample();
+		
+		/* And here's frames (where 1 frame is a collection of samples, 1 for each channel,
+		   so for 5.1 a frame would be 6 samples)
+		*/
+		int const frames = samples / _fs->audio_channels;
+
+		/* Compute the resampled frame count and add 32 for luck */
+		int const out_buffer_size_frames = ceil (frames * target_sample_rate() / _fs->audio_sample_rate) + 32;
+		int const out_buffer_size_bytes = out_buffer_size_frames * _fs->audio_channels * _fs->bytes_per_sample();
+		out_buffer = new uint8_t[out_buffer_size_bytes];
+
+		uint8_t* out[2] = {
+			out_buffer, 
+			0
+		};
+
+		/* Resample audio */
+		int out_frames = swr_convert (_swr_context, out, out_buffer_size_frames, in, size);
+		if (out_frames < 0) {
+			throw EncodeError ("could not run sample-rate converter");
+		}
+
+		/* And point our variables at the resampled audio */
+		data = out_buffer;
+		size = out_frames * _fs->audio_channels * _fs->bytes_per_sample();
+	}
+#endif
+
+	write_audio (data, size);
+
+	/* Delete the sample-rate conversion buffer, if it exists */
+	delete[] out_buffer;
+}
+
+void
+J2KWAVEncoder::write_audio (uint8_t* data, int size)
 {
 	/* Size of a sample in bytes */
 	int const sample_size = 2;
-	
+
 	/* XXX: we are assuming that sample_size is right, the _deinterleave_buffer_size is a multiple
 	   of the sample size and that data_size is a multiple of _fs->audio_channels * sample_size.
 	*/
@@ -293,7 +400,7 @@ J2KWAVEncoder::process_audio (uint8_t* data, int data_size)
 	/* XXX: this code is very tricksy and it must be possible to make it simpler ... */
 	
 	/* Number of bytes left to read this time */
-	int remaining = data_size;
+	int remaining = size;
 	/* Our position in the output buffers, in bytes */
 	int position = 0;
 	while (remaining > 0) {
@@ -313,7 +420,7 @@ J2KWAVEncoder::process_audio (uint8_t* data, int data_size)
 				sf_write_short (_sound_files[i], (const short *) _deinterleave_buffer, this_time / sample_size);
 				break;
 			default:
-				throw DecodeError ("unknown audio sample format");
+				throw EncodeError ("unknown audio sample format");
 			}
 		}
 		
@@ -321,3 +428,23 @@ J2KWAVEncoder::process_audio (uint8_t* data, int data_size)
 		remaining -= this_time * _fs->audio_channels;
 	}
 }
+
+int
+J2KWAVEncoder::target_sample_rate () const
+{
+	double t = dcp_audio_sample_rate (_fs->audio_sample_rate);
+	if (rint (_fs->frames_per_second) != _fs->frames_per_second) {
+		if (_fs->frames_per_second == 23.976) {
+			/* 24fps drop-frame ie 24 * 1000 / 1001 frames per second;
+			   hence we need to resample the audio to dcp_audio_sample_rate * 1000 / 1001
+			   so that when we play it back at dcp_audio_sample_rate it is sped up
+			   by the same amount that the video is
+			*/
+			t *= double(1000) / 1001;
+		} else {
+			throw EncodeError ("unknown fractional frame rate");
+		}
+	}
+
+	return rint (t);
+}
author	Carl Hetherington <cth@carlh.net>	2012-09-29 23:41:25 +0100
committer	Carl Hetherington <cth@carlh.net>	2012-09-29 23:41:25 +0100
commit	f3fdae3f8f4ae54b17f925f81a5e9d4b3589269b (patch)
tree	dc80a1c814b67e15b7bba8902b3a331ce9ea2d80 /src/lib/j2k_wav_encoder.cc
parent	1774f34b5420c0526991f3f1b621d9ca53eaf345 (diff)