summaryrefslogtreecommitdiff
path: root/src/lib/j2k_wav_encoder.cc
diff options
context:
space:
mode:
authorCarl Hetherington <cth@carlh.net>2012-09-29 23:41:25 +0100
committerCarl Hetherington <cth@carlh.net>2012-09-29 23:41:25 +0100
commitf3fdae3f8f4ae54b17f925f81a5e9d4b3589269b (patch)
treedc80a1c814b67e15b7bba8902b3a331ce9ea2d80 /src/lib/j2k_wav_encoder.cc
parent1774f34b5420c0526991f3f1b621d9ca53eaf345 (diff)
Entirely untested resampling to fix 24fps drop-frame.
Diffstat (limited to 'src/lib/j2k_wav_encoder.cc')
-rw-r--r--src/lib/j2k_wav_encoder.cc137
1 files changed, 132 insertions, 5 deletions
diff --git a/src/lib/j2k_wav_encoder.cc b/src/lib/j2k_wav_encoder.cc
index 9ae01c774..86c3ae13f 100644
--- a/src/lib/j2k_wav_encoder.cc
+++ b/src/lib/j2k_wav_encoder.cc
@@ -46,6 +46,9 @@ using namespace boost;
J2KWAVEncoder::J2KWAVEncoder (shared_ptr<const FilmState> s, shared_ptr<const Options> o, Log* l)
: Encoder (s, o, l)
+#ifdef HAVE_SWRESAMPLE
+ , _swr_context (0)
+#endif
, _deinterleave_buffer_size (8192)
, _deinterleave_buffer (0)
, _process_end (false)
@@ -210,8 +213,31 @@ J2KWAVEncoder::encoder_thread (ServerDescription* server)
}
void
-J2KWAVEncoder::process_begin ()
+J2KWAVEncoder::process_begin (int64_t audio_channel_layout, AVSampleFormat audio_sample_format)
{
+ if ((_fs->audio_sample_rate != dcp_audio_sample_rate (_fs->audio_sample_rate)) || (rint (_fs->frames_per_second) != _fs->frames_per_second)) {
+#ifdef HAVE_SWRESAMPLE
+ _swr_context = swr_alloc_set_opts (
+ 0,
+ audio_channel_layout,
+ audio_sample_format,
+ target_sample_rate(),
+ audio_channel_layout,
+ audio_sample_format,
+ _fs->audio_sample_rate,
+ 0, 0
+ );
+
+ swr_init (_swr_context);
+#else
+ throw EncodeError ("Cannot resample audio as libswresample is not present");
+#endif
+ } else {
+#ifdef HAVE_SWRESAMPLE
+ _swr_context = 0;
+#endif
+ }
+
for (int i = 0; i < Config::instance()->num_local_encoding_threads (); ++i) {
_worker_threads.push_back (new boost::thread (boost::bind (&J2KWAVEncoder::encoder_thread, this, (ServerDescription *) 0)));
}
@@ -268,6 +294,34 @@ J2KWAVEncoder::process_end ()
_log->log (s.str ());
}
}
+
+#if HAVE_SWRESAMPLE
+ if (_swr_context) {
+
+ int mop = 0;
+ while (1) {
+ uint8_t buffer[256 * _fs->bytes_per_sample() * _fs->audio_channels];
+ uint8_t* out[1] = {
+ buffer
+ };
+
+ int const frames = swr_convert (_swr_context, out, 256, 0, 0);
+
+ if (frames < 0) {
+ throw EncodeError ("could not run sample-rate converter");
+ }
+
+ if (frames == 0) {
+ break;
+ }
+
+ mop += frames;
+ write_audio (buffer, frames);
+ }
+
+ swr_free (&_swr_context);
+ }
+#endif
close_sound_files ();
@@ -281,11 +335,64 @@ J2KWAVEncoder::process_end ()
}
void
-J2KWAVEncoder::process_audio (uint8_t* data, int data_size)
+J2KWAVEncoder::process_audio (uint8_t* data, int size)
+{
+ /* This is a buffer we might use if we are sample-rate converting;
+ it will need freeing if so.
+ */
+ uint8_t* out_buffer = 0;
+
+ /* Maybe sample-rate convert */
+#if HAVE_SWRESAMPLE
+ if (_swr_context) {
+
+ uint8_t const * in[2] = {
+ data,
+ 0
+ };
+
+ /* Here's samples per channel */
+ int const samples = size / _fs->bytes_per_sample();
+
+ /* And here's frames (where 1 frame is a collection of samples, 1 for each channel,
+ so for 5.1 a frame would be 6 samples)
+ */
+ int const frames = samples / _fs->audio_channels;
+
+ /* Compute the resampled frame count and add 32 for luck */
+ int const out_buffer_size_frames = ceil (frames * target_sample_rate() / _fs->audio_sample_rate) + 32;
+ int const out_buffer_size_bytes = out_buffer_size_frames * _fs->audio_channels * _fs->bytes_per_sample();
+ out_buffer = new uint8_t[out_buffer_size_bytes];
+
+ uint8_t* out[2] = {
+ out_buffer,
+ 0
+ };
+
+ /* Resample audio */
+ int out_frames = swr_convert (_swr_context, out, out_buffer_size_frames, in, size);
+ if (out_frames < 0) {
+ throw EncodeError ("could not run sample-rate converter");
+ }
+
+ /* And point our variables at the resampled audio */
+ data = out_buffer;
+ size = out_frames * _fs->audio_channels * _fs->bytes_per_sample();
+ }
+#endif
+
+ write_audio (data, size);
+
+ /* Delete the sample-rate conversion buffer, if it exists */
+ delete[] out_buffer;
+}
+
+void
+J2KWAVEncoder::write_audio (uint8_t* data, int size)
{
/* Size of a sample in bytes */
int const sample_size = 2;
-
+
/* XXX: we are assuming that sample_size is right, the _deinterleave_buffer_size is a multiple
of the sample size and that data_size is a multiple of _fs->audio_channels * sample_size.
*/
@@ -293,7 +400,7 @@ J2KWAVEncoder::process_audio (uint8_t* data, int data_size)
/* XXX: this code is very tricksy and it must be possible to make it simpler ... */
/* Number of bytes left to read this time */
- int remaining = data_size;
+ int remaining = size;
/* Our position in the output buffers, in bytes */
int position = 0;
while (remaining > 0) {
@@ -313,7 +420,7 @@ J2KWAVEncoder::process_audio (uint8_t* data, int data_size)
sf_write_short (_sound_files[i], (const short *) _deinterleave_buffer, this_time / sample_size);
break;
default:
- throw DecodeError ("unknown audio sample format");
+ throw EncodeError ("unknown audio sample format");
}
}
@@ -321,3 +428,23 @@ J2KWAVEncoder::process_audio (uint8_t* data, int data_size)
remaining -= this_time * _fs->audio_channels;
}
}
+
+int
+J2KWAVEncoder::target_sample_rate () const
+{
+ double t = dcp_audio_sample_rate (_fs->audio_sample_rate);
+ if (rint (_fs->frames_per_second) != _fs->frames_per_second) {
+ if (_fs->frames_per_second == 23.976) {
+ /* 24fps drop-frame ie 24 * 1000 / 1001 frames per second;
+ hence we need to resample the audio to dcp_audio_sample_rate * 1000 / 1001
+ so that when we play it back at dcp_audio_sample_rate it is sped up
+ by the same amount that the video is
+ */
+ t *= double(1000) / 1001;
+ } else {
+ throw EncodeError ("unknown fractional frame rate");
+ }
+ }
+
+ return rint (t);
+}