Basic grunt-work, untested and unfinished, but it compiles.
[dcpomatic.git] / src / lib / analyse_audio_job.cc
1 /*
2     Copyright (C) 2012-2015 Carl Hetherington <cth@carlh.net>
3
4     This file is part of DCP-o-matic.
5
6     DCP-o-matic is free software; you can redistribute it and/or modify
7     it under the terms of the GNU General Public License as published by
8     the Free Software Foundation; either version 2 of the License, or
9     (at your option) any later version.
10
11     DCP-o-matic is distributed in the hope that it will be useful,
12     but WITHOUT ANY WARRANTY; without even the implied warranty of
13     MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
14     GNU General Public License for more details.
15
16     You should have received a copy of the GNU General Public License
17     along with DCP-o-matic.  If not, see <http://www.gnu.org/licenses/>.
18
19 */
20
21 #include "audio_analysis.h"
22 #include "audio_buffers.h"
23 #include "analyse_audio_job.h"
24 #include "audio_content.h"
25 #include "compose.hpp"
26 #include "film.h"
27 #include "player.h"
28 #include "playlist.h"
29 #include "filter.h"
30 #include "audio_filter_graph.h"
31 #include "config.h"
32 extern "C" {
33 #include <libavutil/channel_layout.h>
34 #ifdef DCPOMATIC_HAVE_EBUR128_PATCHED_FFMPEG
35 #include <libavfilter/f_ebur128.h>
36 #endif
37 }
38 #include <boost/foreach.hpp>
39 #include <iostream>
40
41 #include "i18n.h"
42
43 using std::string;
44 using std::vector;
45 using std::max;
46 using std::min;
47 using std::cout;
48 using boost::shared_ptr;
49 using boost::dynamic_pointer_cast;
50
51 int const AnalyseAudioJob::_num_points = 1024;
52
53 AnalyseAudioJob::AnalyseAudioJob (shared_ptr<const Film> film, shared_ptr<const Playlist> playlist)
54         : Job (film)
55         , _playlist (playlist)
56         , _done (0)
57         , _samples_per_point (1)
58         , _current (0)
59         , _sample_peak (new float[film->audio_channels()])
60         , _sample_peak_frame (new Frame[film->audio_channels()])
61 #ifdef DCPOMATIC_HAVE_EBUR128_PATCHED_FFMPEG
62         , _ebur128 (new AudioFilterGraph (film->audio_frame_rate(), film->audio_channels()))
63 #endif
64 {
65 #ifdef DCPOMATIC_HAVE_EBUR128_PATCHED_FFMPEG
66         _filters.push_back (new Filter ("ebur128", "ebur128", "audio", "ebur128=peak=true"));
67         _ebur128->setup (_filters);
68 #endif
69
70         for (int i = 0; i < film->audio_channels(); ++i) {
71                 _sample_peak[i] = 0;
72                 _sample_peak_frame[i] = 0;
73         }
74 }
75
76 AnalyseAudioJob::~AnalyseAudioJob ()
77 {
78         BOOST_FOREACH (Filter const * i, _filters) {
79                 delete const_cast<Filter*> (i);
80         }
81         delete[] _current;
82         delete[] _sample_peak;
83         delete[] _sample_peak_frame;
84 }
85
86 string
87 AnalyseAudioJob::name () const
88 {
89         return _("Analyse audio");
90 }
91
92 string
93 AnalyseAudioJob::json_name () const
94 {
95         return N_("analyse_audio");
96 }
97
98 void
99 AnalyseAudioJob::run ()
100 {
101         shared_ptr<Player> player (new Player (_film, _playlist));
102         player->set_ignore_video ();
103         player->set_fast ();
104         player->set_play_referenced ();
105         player->Audio.connect (bind (&AnalyseAudioJob::analyse, this, _1, _2));
106
107         DCPTime const start = _playlist->start().get_value_or (DCPTime ());
108         DCPTime const length = _playlist->length ();
109
110         Frame const len = DCPTime (length - start).frames_round (_film->audio_frame_rate());
111         _samples_per_point = max (int64_t (1), len / _num_points);
112
113         delete[] _current;
114         _current = new AudioPoint[_film->audio_channels ()];
115         _analysis.reset (new AudioAnalysis (_film->audio_channels ()));
116
117         bool has_any_audio = false;
118         BOOST_FOREACH (shared_ptr<Content> c, _playlist->content ()) {
119                 if (c->audio) {
120                         has_any_audio = true;
121                 }
122         }
123
124         if (has_any_audio) {
125                 _done = 0;
126                 while (!player->pass ()) {}
127         }
128
129         vector<AudioAnalysis::PeakTime> sample_peak;
130         for (int i = 0; i < _film->audio_channels(); ++i) {
131                 sample_peak.push_back (
132                         AudioAnalysis::PeakTime (_sample_peak[i], DCPTime::from_frames (_sample_peak_frame[i], _film->audio_frame_rate ()))
133                         );
134         }
135         _analysis->set_sample_peak (sample_peak);
136
137 #ifdef DCPOMATIC_HAVE_EBUR128_PATCHED_FFMPEG
138         if (Config::instance()->analyse_ebur128 ()) {
139                 void* eb = _ebur128->get("Parsed_ebur128_0")->priv;
140                 vector<float> true_peak;
141                 for (int i = 0; i < _film->audio_channels(); ++i) {
142                         true_peak.push_back (av_ebur128_get_true_peaks(eb)[i]);
143                 }
144                 _analysis->set_true_peak (true_peak);
145                 _analysis->set_integrated_loudness (av_ebur128_get_integrated_loudness(eb));
146                 _analysis->set_loudness_range (av_ebur128_get_loudness_range(eb));
147         }
148 #endif
149
150         if (_playlist->content().size() == 1) {
151                 /* If there was only one piece of content in this analysis we may later need to know what its
152                    gain was when we analysed it.
153                 */
154                 shared_ptr<const AudioContent> ac = _playlist->content().front()->audio;
155                 DCPOMATIC_ASSERT (ac);
156                 _analysis->set_analysis_gain (ac->gain ());
157         }
158
159         _analysis->write (_film->audio_analysis_path (_playlist));
160
161         set_progress (1);
162         set_state (FINISHED_OK);
163 }
164
165 void
166 AnalyseAudioJob::analyse (shared_ptr<const AudioBuffers> b, DCPTime time)
167 {
168 #ifdef DCPOMATIC_HAVE_EBUR128_PATCHED_FFMPEG
169         if (Config::instance()->analyse_ebur128 ()) {
170                 _ebur128->process (b);
171         }
172 #endif
173
174         int const frames = b->frames ();
175         int const channels = b->channels ();
176
177         for (int j = 0; j < channels; ++j) {
178                 float* data = b->data(j);
179                 for (int i = 0; i < frames; ++i) {
180                         float s = data[i];
181                         float as = fabsf (s);
182                         if (as < 10e-7) {
183                                 /* We may struggle to serialise and recover inf or -inf, so prevent such
184                                    values by replacing with this (140dB down) */
185                                 s = as = 10e-7;
186                         }
187                         _current[j][AudioPoint::RMS] += pow (s, 2);
188                         _current[j][AudioPoint::PEAK] = max (_current[j][AudioPoint::PEAK], as);
189
190                         if (as > _sample_peak[j]) {
191                                 _sample_peak[j] = as;
192                                 _sample_peak_frame[j] = _done + i;
193                         }
194
195                         if (((_done + i) % _samples_per_point) == 0) {
196                                 _current[j][AudioPoint::RMS] = sqrt (_current[j][AudioPoint::RMS] / _samples_per_point);
197                                 _analysis->add_point (j, _current[j]);
198                                 _current[j] = AudioPoint ();
199                         }
200                 }
201         }
202
203         _done += frames;
204
205         DCPTime const start = _playlist->start().get_value_or (DCPTime ());
206         DCPTime const length = _playlist->length ();
207         set_progress ((time.seconds() - start.seconds()) / (length.seconds() - start.seconds()));
208 }