2 Copyright (C) 2010-2013 Paul Davis
3 Author: Robin Gareus <robin@gareus.org>
5 This program is free software; you can redistribute it and/or modify
6 it under the terms of the GNU General Public License as published by
7 the Free Software Foundation; either version 2 of the License, or
8 (at your option) any later version.
10 This program is distributed in the hope that it will be useful,
11 but WITHOUT ANY WARRANTY; without even the implied warranty of
12 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
13 GNU General Public License for more details.
15 You should have received a copy of the GNU General Public License
16 along with this program; if not, write to the Free Software
17 Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
23 #include <sys/types.h>
25 #include "pbd/error.h"
26 #include "pbd/convert.h"
27 #include "pbd/file_utils.h"
28 #include "gui_thread.h"
30 #include "transcode_ffmpeg.h"
31 #include "utils_videotl.h"
32 #include "video_tool_paths.h"
37 using namespace VideoUtils;
/**
 * Construct a transcoder front-end for a single media file.
 *
 * Resets the A/V offset, lead-in/lead-out and frame size to zero, asks
 * ArdourVideoToolPaths::transcoder_exe() to fill in ffmpeg_exe and
 * ffprobe_exe (logging a warning if that lookup reports failure) and then
 * calls probe() unless infile is empty.
 *
 * @param f NOTE(review): presumably the input file path that ends up in
 *          infile; the initialisation is not visible in this excerpt --
 *          confirm.
 */
39 TranscodeFfmpeg::TranscodeFfmpeg (std::string f)
45 m_avoffset = m_lead_in = m_lead_out = 0;
46 m_width = m_height = 0;
49 #if 1 /* tentative debug mode */
/* Look up the external tool paths; a failed lookup is reported to the
 * user through the warning stream with installation instructions. */
53 if (!ArdourVideoToolPaths::transcoder_exe(ffmpeg_exe, ffprobe_exe)) {
54 warning << string_compose(
56 "No ffprobe or ffmpeg executables could be found on this system.\n"
57 "Video import and export is not possible until you install those tools.\n"
58 "%1 requires ffmpeg and ffprobe from ffmpeg.org - version 1.1 or newer.\n"
60 "The tools are included with the %1 releases from ardour.org "
61 "and also available with the video-server at http://x42.github.com/harvid/\n"
63 "Important: the files need to be installed in $PATH and named ffmpeg_harvid and ffprobe_harvid.\n"
64 "If you already have a suitable ffmpeg installation on your system, we recommend creating "
65 "symbolic links from ffmpeg to ffmpeg_harvid and from ffprobe to ffprobe_harvid.\n"
67 "see also http://manual.ardour.org/video-timeline/setup/"
68 ), PROGRAM_NAME) << endmsg;
/* Short-circuit evaluation: probe() is only attempted for a non-empty
 * file name. What this branch does on failure is not visible in this
 * excerpt. */
73 if (infile.empty() || !probe()) {
/**
 * Destructor.
 *
 * NOTE(review): the body is not part of this excerpt, so the cleanup it
 * performs (if any) cannot be described here.
 */
79 TranscodeFfmpeg::~TranscodeFfmpeg ()
/**
 * Run ffprobe on infile and cache the stream properties it reports.
 *
 * Launches ffprobe with "-print_format csv=nk=0 -show_format -show_streams",
 * routes its stdout to ffprobeparse() and its termination to ffexit(),
 * waits for the process to finish and then parses ffoutput with ParseCSV().
 *
 * A video "stream" record is evaluated only while m_width is still 0; it
 * supplies the stream index, frame size, codec description, frame rate,
 * duration and aspect ratios. Every audio "stream" record is collected
 * into an entry that is appended to m_audio.
 *
 * The return type and the return statements are outside this excerpt.
 */
85 TranscodeFfmpeg::probe ()
/* Seven argv slots: six arguments are set below and calloc() leaves the
 * remaining slot zeroed as terminator. "csv=nk=0" makes ffprobe emit
 * key=value fields, which the parser further down relies on. */
89 argp=(char**) calloc(7,sizeof(char*));
90 argp[0] = strdup(ffprobe_exe.c_str());
91 argp[1] = strdup("-print_format");
92 argp[2] = strdup("csv=nk=0");
93 argp[3] = strdup("-show_format");
94 argp[4] = strdup("-show_streams");
95 argp[5] = strdup(infile.c_str());
97 ffcmd = new ARDOUR::SystemExec(ffprobe_exe, argp);
98 ffcmd->ReadStdout.connect_same_thread (*this, boost::bind (&TranscodeFfmpeg::ffprobeparse, this, _1 ,_2));
99 ffcmd->Terminated.connect_same_thread (*this, boost::bind (&TranscodeFfmpeg::ffexit, this));
100 if (ffcmd->start(1)) {
105 /* wait for ffprobe process to exit */
108 /* wait for interposer thread to copy all data.
109 * SystemExec::Terminated is emitted and ffcmd set to NULL */
110 int timeout = 300; // 1.5 sec
111 while (ffcmd && --timeout > 0) {
/* Give up when the wait above ran out or ffprobe produced no output. */
114 if (timeout == 0 || ffoutput.empty()) {
120 std::vector<std::vector<std::string> > lines;
121 ParseCSV(ffoutput, lines);
/* Start from a clean slate so stale values never survive a re-probe. */
123 m_width = m_height = 0;
124 m_fps = m_aspect = 0;
/* PARSE_FRACTIONAL_FPS(VAR): when `value` has the form "num/den", store
 * num divided by den in VAR. atof() is called with std::string arguments,
 * so this is presumably the PBD overload from pbd/convert.h rather than
 * the C library function -- TODO confirm.
 * NOTE(review): no zero-denominator check is visible in this excerpt. */
130 #define PARSE_FRACTIONAL_FPS(VAR) \
132 std::string::size_type pos; \
134 pos = value.find_first_of('/'); \
135 if (pos != std::string::npos) { \
136 VAR = atof(value.substr(0, pos)) / atof(value.substr(pos+1)); \
/* Walk the parsed CSV records; field 0 identifies the record type. */
140 for (std::vector<std::vector<std::string> >::iterator i = lines.begin(); i != lines.end(); ++i) {
141 if (i->at(0) == X_("format")) {
142 /* format,filename,#streams,format-name,format-long-name,start-time,duration,size,bitrate */
144 if (i->at(0) == X_("stream")) {
/* NOTE(review): field 5 is expected to hold the codec_type pair; this
 * depends on ffprobe's column order, and std::vector::at() throws
 * std::out_of_range for records with fewer fields. */
145 if (i->at(5) == X_("codec_type=video") && m_width == 0) {
/* Split every field at the first '=' into key and value; fields without
 * an '=' are skipped. */
147 for (std::vector<std::string>::iterator kv = i->begin(); kv != i->end(); ++kv) {
148 const size_t kvsep = kv->find('=');
149 if(kvsep == std::string::npos) continue;
150 std::string key = kv->substr(0, kvsep);
151 std::string value = kv->substr(kvsep + 1);
153 if (key == X_("index")) {
154 m_videoidx = atoi(value);
155 } else if (key == X_("width")) {
156 m_width = atoi(value);
157 } else if (key == X_("height")) {
158 m_height = atoi(value);
159 } else if (key == X_("codec_name")) {
160 if (!m_codec.empty()) m_codec += " ";
162 } else if (key == X_("codec_long_name")) {
163 if (!m_codec.empty()) m_codec += " ";
164 m_codec += "[" + value + "]";
165 } else if (key == X_("codec_tag_string")) {
166 if (!m_codec.empty()) m_codec += " ";
167 m_codec += "(" + value + ")";
168 } else if (key == X_("r_frame_rate")) {
169 PARSE_FRACTIONAL_FPS(m_fps)
170 } else if (key == X_("avg_frame_rate") && m_fps == 0) {
171 PARSE_FRACTIONAL_FPS(m_fps)
172 } else if (key == X_("time_base")) {
173 PARSE_FRACTIONAL_FPS(timebase)
/* NOTE(review): the timecode is re-read from the hard-coded column
 * i->at(16) instead of `value`, and "%s" writes into the 7-byte buffer
 * f without a field width, so an over-long fraction would overflow it. */
174 } else if (key == X_("timecode") && m_duration == 0) {
175 int h,m,s; char f[7];
176 if (sscanf(i->at(16).c_str(), "%d:%d:%d:%s",&h,&m,&s,f) == 4) {
177 m_duration = (ARDOUR::framecnt_t) floor(m_fps * (
181 + atoi(f) / pow((double)10, (int)strlen(f))
/* NOTE(review): this branch requires m_fps == 0 and then multiplies by
 * m_fps, so as written it can only ever store 0; m_fps != 0 was probably
 * intended -- confirm before relying on duration_ts. */
184 } else if (key == X_("duration_ts") && m_fps == 0 && timebase !=0 ) {
185 m_duration = atof(value) * m_fps * timebase;
186 } else if (key == X_("duration") && m_fps != 0 && m_duration == 0) {
187 m_duration = atof(value) * m_fps;
/* Sample aspect ratio "a:b" with non-zero b: the character at the ':'
 * position of m_sar is replaced by '/'. The assignment of m_sar itself
 * is not visible in this excerpt. */
188 } else if (key == X_("sample_aspect_ratio")) {
189 std::string::size_type pos;
190 pos = value.find_first_of(':');
191 if (pos != std::string::npos && atof(value.substr(pos+1)) != 0) {
193 m_sar.replace(pos, 1, "/");
/* Display aspect ratio "a:b" with non-zero b becomes the quotient a/b. */
195 } else if (key == X_("display_aspect_ratio")) {
196 std::string::size_type pos;
197 pos = value.find_first_of(':');
198 if (pos != std::string::npos && atof(value.substr(pos+1)) != 0) {
199 m_aspect = atof(value.substr(0, pos)) / atof(value.substr(pos+1));
/* Aspect ratio derived from the pixel dimensions; the condition guarding
 * this assignment is not visible in this excerpt. */
205 m_aspect = (double)m_width / (double)m_height;
/* Audio stream: gather channel count, stream index and a descriptive
 * name into `as`, then append it to m_audio. */
208 } else if (i->at(5) == X_("codec_type=audio")) { /* new ffprobe */
210 for (std::vector<std::string>::iterator kv = i->begin(); kv != i->end(); ++kv) {
211 const size_t kvsep = kv->find('=');
212 if(kvsep == std::string::npos) continue;
213 std::string key = kv->substr(0, kvsep);
214 std::string value = kv->substr(kvsep + 1);
216 if (key == X_("channels")) {
217 as.channels = atoi(value);
218 } else if (key == X_("index")) {
219 as.stream_id = value;
220 } else if (key == X_("codec_long_name")) {
221 if (!as.name.empty()) as.name += " ";
223 } else if (key == X_("codec_name")) {
224 if (!as.name.empty()) as.name += " ";
226 } else if (key == X_("sample_fmt")) {
227 if (!as.name.empty()) as.name += " ";
228 as.name += "FMT:" + value;
229 } else if (key == X_("sample_rate")) {
230 if (!as.name.empty()) as.name += " ";
231 as.name += "SR:" + value;
235 m_audio.push_back(as);
/* Dump of the probed properties to stdout. Presumably only active in
 * debug mode; the guard is not visible in this excerpt. */
242 printf("FPS: %f\n", m_fps);
243 printf("Duration: %lu frames\n",(unsigned long)m_duration);
244 printf("W/H: %ix%i\n",m_width, m_height);
245 printf("aspect: %f\n",m_aspect);
246 printf("codec: %s\n",m_codec.c_str());
247 if (m_audio.size() > 0) {
248 for (AudioStreams::iterator it = m_audio.begin(); it < m_audio.end(); ++it) {
249 printf("audio: %s - %i channels\n",(*it).stream_id.c_str(), (*it).channels);
252 printf("audio: no audio streams in file.\n");
/**
 * Build the default set of ffmpeg encoder options.
 *
 * The keys are ffmpeg command-line switches and the values their
 * arguments: MPEG-4 video at 5000k and AC-3 audio at 160k.
 * The return statement is not visible in this excerpt; presumably the
 * populated map `ffs` is returned.
 */
259 TranscodeFfmpeg::FFSettings
260 TranscodeFfmpeg::default_encoder_settings ()
262 TranscodeFfmpeg::FFSettings ffs;
264 ffs["-vcodec"] = "mpeg4";
265 ffs["-acodec"] = "ac3";
266 ffs["-b:v"] = "5000k";
267 ffs["-b:a"] = "160k";
/**
 * Build the default metadata map.
 *
 * It contains a single "comment" entry reading "Created with " followed
 * by PROGRAM_NAME. The return statement is not visible in this excerpt;
 * presumably the populated map `ffm` is returned.
 */
271 TranscodeFfmpeg::FFSettings
272 TranscodeFfmpeg::default_meta_data ()
274 TranscodeFfmpeg::FFSettings ffm;
276 ffm["comment"] = "Created with " PROGRAM_NAME;
/**
 * Format one metadata entry as a heap-allocated C string of the form
 * key="value".
 *
 * @param key   metadata key, copied verbatim
 * @param value metadata value; it is sanitised before being quoted
 *
 * The return type and return statement are not visible in this excerpt;
 * encode() stores the result directly in its argv array, so presumably
 * the calloc()ed buffer `mds` is returned -- confirm.
 */
281 TranscodeFfmpeg::format_metadata (std::string key, std::string value)
283 size_t start_pos = 0;
284 std::string v1 = value;
/* Pass 1: every character outside the whitelist below becomes '_'.
 * The statement advancing start_pos is not visible in this excerpt. */
285 while((start_pos = v1.find_first_not_of(
286 "abcdefghijklmnopqrstuvwxyz ABCDEFGHIJKLMNOPQRSTUVWXYZ0123456789(),.\"'",
287 start_pos)) != std::string::npos)
289 v1.replace(start_pos, 1, "_");
/* Pass 2: escape each double quote with a backslash. */
294 while((start_pos = v1.find("\"", start_pos)) != std::string::npos) {
295 v1.replace(start_pos, 1, "\\\"");
/* +4 covers the '=', the two surrounding quotes and the terminating NUL. */
299 size_t len = key.length() + v1.length() + 4;
300 char *mds = (char*) calloc(len, sizeof(char));
301 snprintf(mds, len, "%s=\"%s\"", key.c_str(), v1.c_str());
/**
 * Launch ffmpeg to encode a video input and an audio input into outfile.
 *
 * @param outfile output path; passed as the last argument, after "-y"
 * @param inf_a   audio input, given as the second "-i" (ffmpeg input 1)
 * @param inf_v   video input, given as the first "-i" (ffmpeg input 0)
 * @param ffs     option/value pairs appended verbatim to the command line
 * @param meta    key/value pairs; each is emitted as a "-metadata"
 *                argument formatted by format_metadata()
 * @param map     NOTE(review): presumably enables the "-map" arguments
 *                below; its use is not visible in this excerpt -- confirm
 *
 * ffmpeg's stdout is routed to ffmpegparse_v() and its termination to
 * ffexit(). The return type and the handling of the start() result are
 * outside this excerpt.
 */
306 TranscodeFfmpeg::encode (std::string outfile, std::string inf_a, std::string inf_v, TranscodeFfmpeg::FFSettings ffs, TranscodeFfmpeg::FFSettings meta, bool map)
/* Fixed-size argv. NOTE(review): the capacity is only checked by the
 * assert() further down, after every slot has already been written, so
 * very large ffs/meta maps could overrun the array before it fires. */
308 #define MAX_FFMPEG_ENCODER_ARGS (100)
312 argp=(char**) calloc(MAX_FFMPEG_ENCODER_ARGS,sizeof(char*));
313 argp[a++] = strdup(ffmpeg_exe.c_str());
/* Equivalent to m_avoffset != 0. "-itsoffset" is placed in front of the
 * video "-i", so the offset is applied to the video input. */
314 if (m_avoffset < 0 || m_avoffset > 0) {
315 std::ostringstream osstream; osstream << m_avoffset;
316 argp[a++] = strdup("-itsoffset");
317 argp[a++] = strdup(osstream.str().c_str());
319 argp[a++] = strdup("-i");
320 argp[a++] = strdup(inf_v.c_str());
322 argp[a++] = strdup("-i");
323 argp[a++] = strdup(inf_a.c_str());
325 for(TranscodeFfmpeg::FFSettings::const_iterator it = ffs.begin(); it != ffs.end(); ++it) {
326 argp[a++] = strdup(it->first.c_str());
327 argp[a++] = strdup(it->second.c_str());
329 for(TranscodeFfmpeg::FFSettings::const_iterator it = meta.begin(); it != meta.end(); ++it) {
330 argp[a++] = strdup("-metadata");
331 argp[a++] = format_metadata(it->first.c_str(), it->second.c_str());
/* Snap lead-in/lead-out to a whole number of video frames.
 * NOTE(review): this divides by m_fps and no zero check is visible in
 * this excerpt. */
335 m_lead_in = rint (m_lead_in * m_fps) / m_fps;
336 m_lead_out = rint (m_lead_out * m_fps) / m_fps;
/* Pad the video with black: a "color" source of the probed frame size
 * (plus the sample aspect ratio when known) lasting m_lead_in and/or
 * m_lead_out is concatenated before and/or after the input. */
339 if (m_lead_in != 0 && m_lead_out != 0) {
340 std::ostringstream osstream;
341 argp[a++] = strdup("-vf");
342 osstream << X_("color=c=black:s=") << m_width << X_("x") << m_height << X_(":d=") << m_lead_in;
343 if (!m_sar.empty()) osstream << X_(":sar=") << m_sar;
344 osstream << X_(" [pre]; ");
345 osstream << X_("color=c=black:s=") << m_width << X_("x") << m_height << X_(":d=") << m_lead_out;
346 if (!m_sar.empty()) osstream << X_(":sar=") << m_sar;
347 osstream << X_(" [post]; ");
348 osstream << X_("[pre] [in] [post] concat=n=3");
349 argp[a++] = strdup(osstream.str().c_str());
350 } else if (m_lead_in != 0) {
351 std::ostringstream osstream;
352 argp[a++] = strdup("-vf");
353 osstream << X_("color=c=black:s=") << m_width << X_("x") << m_height << X_(":d=") << m_lead_in;
354 if (!m_sar.empty()) osstream << X_(":sar=") << m_sar;
355 osstream << X_(" [pre]; ");
356 osstream << X_("[pre] [in] concat=n=2");
357 argp[a++] = strdup(osstream.str().c_str());
358 } else if (m_lead_out != 0) {
359 std::ostringstream osstream;
360 argp[a++] = strdup("-vf");
361 osstream << X_("color=c=black:s=") << m_width << X_("x") << m_height << X_(":d=") << m_lead_out;
362 if (!m_sar.empty()) osstream << X_(":sar=") << m_sar;
363 osstream << X_(" [post]; ");
364 osstream << X_("[in] [post] concat=n=2");
365 argp[a++] = strdup(osstream.str().c_str());
/* Select the probed video stream of input 0 and the first stream of
 * input 1 (the audio file). */
369 std::ostringstream osstream;
370 argp[a++] = strdup("-map");
371 osstream << X_("0:") << m_videoidx;
372 argp[a++] = strdup(osstream.str().c_str());
373 argp[a++] = strdup("-map");
374 argp[a++] = strdup("1:0");
/* "-y": let ffmpeg overwrite an existing output file without asking. */
377 argp[a++] = strdup("-y");
378 argp[a++] = strdup(outfile.c_str());
380 assert(a<MAX_FFMPEG_ENCODER_ARGS);
381 /* Note: these are free()d in ~SystemExec */
383 if (debug_enable) { /* tentative debug mode */
384 printf("EXPORT ENCODE:\n");
385 for (int i=0; i< a; ++i) {
386 printf("%s ", argp[i]);
392 ffcmd = new ARDOUR::SystemExec(ffmpeg_exe, argp);
393 ffcmd->ReadStdout.connect_same_thread (*this, boost::bind (&TranscodeFfmpeg::ffmpegparse_v, this, _1 ,_2));
394 ffcmd->Terminated.connect_same_thread (*this, boost::bind (&TranscodeFfmpeg::ffexit, this));
395 if (ffcmd->start(2)) {
/**
 * Launch ffmpeg to extract one audio stream of infile into outfile as
 * 32-bit float little-endian PCM ("pcm_f32le"), without video ("-vn").
 *
 * @param outfile output path; an existing file is overwritten ("-y")
 * @param stream  index into m_audio selecting the stream to extract
 *
 * The second parameter (sample rate) is unnamed and unused: the "-ar"
 * arguments are compiled out, so ffmpeg keeps the original rate.
 * Returns false when the file has not been probed successfully or when
 * `stream` is out of range; the remaining return statements are outside
 * this excerpt. ffmpeg's stdout is routed to ffmpegparse_a() and its
 * termination to ffexit().
 */
403 TranscodeFfmpeg::extract_audio (std::string outfile, ARDOUR::framecnt_t /*samplerate*/, unsigned int stream)
405 if (!probeok) return false;
406 if (stream >= m_audio.size()) return false;
/* 15 argv slots: room for 14 arguments plus the NULL terminator. */
411 argp=(char**) calloc(15,sizeof(char*));
412 argp[i++] = strdup(ffmpeg_exe.c_str());
413 argp[i++] = strdup("-i");
414 argp[i++] = strdup(infile.c_str());
415 #if 0 /* ffmpeg write original samplerate, use a3/SRC to resample */
416 argp[i++] = strdup("-ar");
417 argp[i] = (char*) calloc(7,sizeof(char)); snprintf(argp[i++], 7, "%"PRId64, samplerate);
/* NOTE(review): the small fixed buffers below truncate silently: 3 bytes
 * hold at most a two-digit channel count, 8 bytes hold "0:" plus a stream
 * id of up to five characters. */
419 argp[i++] = strdup("-ac");
420 argp[i] = (char*) calloc(3,sizeof(char)); snprintf(argp[i++], 3, "%i", m_audio.at(stream).channels);
421 argp[i++] = strdup("-map");
422 argp[i] = (char*) calloc(8,sizeof(char)); snprintf(argp[i++], 8, "0:%s", m_audio.at(stream).stream_id.c_str());
423 argp[i++] = strdup("-vn");
424 argp[i++] = strdup("-acodec");
425 argp[i++] = strdup("pcm_f32le");
426 argp[i++] = strdup("-y");
427 argp[i++] = strdup(outfile.c_str());
428 argp[i++] = (char *)0;
429 /* Note: argp is free()d in ~SystemExec */
/* NOTE(review): the loop below prints 14 entries and shadows the outer
 * index `i`. Assuming the "#if 0" section ends before "-ac", only 12
 * arguments are set, so the last two entries passed to "%s" would be
 * NULL -- confirm and bound the loop by the outer index instead. */
431 if (debug_enable) { /* tentative debug mode */
432 printf("EXTRACT AUDIO:\n");
433 for (int i=0; i< 14; ++i) {
434 printf("%s ", argp[i]);
440 ffcmd = new ARDOUR::SystemExec(ffmpeg_exe, argp);
441 ffcmd->ReadStdout.connect_same_thread (*this, boost::bind (&TranscodeFfmpeg::ffmpegparse_a, this, _1 ,_2));
442 ffcmd->Terminated.connect_same_thread (*this, boost::bind (&TranscodeFfmpeg::ffexit, this));
443 if (ffcmd->start(2)) {
/**
 * Launch ffmpeg to transcode the video of infile to intra-only MJPEG
 * without audio ("-vcodec mjpeg -an -intra -g 1").
 *
 * @param outfile output path; an existing file is overwritten ("-y")
 * @param outw    requested width. NOTE(review): presumably the initial
 *                value of `width`, whose declaration is not visible here
 * @param outh    requested height (same caveat, for `height`)
 * @param kbitps  initial value of the bitrate variable; the condition
 *                under which the estimate below replaces it is not
 *                visible in this excerpt
 *
 * Returns false when the file has not been probed successfully; the
 * remaining return statements are outside this excerpt. ffmpeg's stdout
 * is routed to ffmpegparse_v() and its termination to ffexit().
 */
452 TranscodeFfmpeg::transcode (std::string outfile, const int outw, const int outh, const int kbitps)
454 if (!probeok) return false;
457 int bitrate = kbitps;
/* An out-of-range width falls back to the source width; an out-of-range
 * height is derived from the width and the probed aspect ratio. */
461 if (width < 1 || width > m_width) { width = m_width; } /* don't allow upscaling */
462 if (height < 1 || height > m_height) { height = floor(width / m_aspect); }
/* Bitrate estimate from frame rate, frame size and bits per pixel. */
465 const double bitperpixel = .7; /* avg quality */
466 bitrate = floor(m_fps * width * height * bitperpixel / 10000.0);
468 bitrate = bitrate / 10;
/* Clamp to 10..1000; the "%i0k" format below appends a zero, so ffmpeg
 * receives a value between 100k and 10000k. */
470 if (bitrate < 10) bitrate = 10;
471 if (bitrate > 1000) bitrate = 1000;
/* 16 argv slots: 15 arguments plus the NULL terminator. */
473 argp=(char**) calloc(16,sizeof(char*));
474 argp[0] = strdup(ffmpeg_exe.c_str());
475 argp[1] = strdup("-i");
476 argp[2] = strdup(infile.c_str());
477 argp[3] = strdup("-b:v");
478 argp[4] = (char*) calloc(7,sizeof(char)); snprintf(argp[4], 7, "%i0k", bitrate);
479 argp[5] = strdup("-s");
/* NOTE(review): 10 bytes fit at most "9999x9999"; larger sizes are
 * truncated by snprintf. */
480 argp[6] = (char*) calloc(10,sizeof(char)); snprintf(argp[6], 10, "%ix%i", width, height);
481 argp[7] = strdup("-y");
482 argp[8] = strdup("-vcodec");
483 argp[9] = strdup("mjpeg");
484 argp[10] = strdup("-an");
485 argp[11] = strdup("-intra");
486 argp[12] = strdup("-g");
487 argp[13] = strdup("1");
488 argp[14] = strdup(outfile.c_str());
489 argp[15] = (char *)0;
490 /* Note: these are free()d in ~SystemExec */
492 if (debug_enable) { /* tentative debug mode */
493 printf("TRANSCODE VIDEO:\n");
494 for (int i=0; i< 15; ++i) {
495 printf("%s ", argp[i]);
500 ffcmd = new ARDOUR::SystemExec(ffmpeg_exe, argp);
501 ffcmd->ReadStdout.connect_same_thread (*this, boost::bind (&TranscodeFfmpeg::ffmpegparse_v, this, _1 ,_2));
502 ffcmd->Terminated.connect_same_thread (*this, boost::bind (&TranscodeFfmpeg::ffexit, this));
503 if (ffcmd->start(2)) {
/**
 * Ask a running ffmpeg/ffprobe child process to stop.
 *
 * Does nothing when no command exists or it is not running. Otherwise
 * "q" is written to the child's stdin (ffmpeg's interactive quit key).
 * A PLATFORM_WINDOWS-specific section follows; its content is not
 * visible in this excerpt.
 */
511 TranscodeFfmpeg::cancel ()
513 if (!ffcmd || !ffcmd->is_running()) { return;}
514 ffcmd->write_to_stdin("q");
515 #ifdef PLATFORM_WINDOWS
/**
 * Slot connected to SystemExec::Terminated by probe(), encode(),
 * extract_audio() and transcode(); emits the Finished signal.
 *
 * NOTE(review): a comment in probe() says ffcmd is set to NULL once the
 * child has terminated; presumably that happens here, but the statements
 * preceding the signal are not visible in this excerpt -- confirm.
 */
526 TranscodeFfmpeg::ffexit ()
530 Finished(); /* EMIT SIGNAL */
/**
 * Slot connected to ReadStdout of the ffprobe process started in probe().
 *
 * @param d chunk of text read from the child's stdout; the second
 *          (size) parameter is unnamed and unused
 *
 * NOTE(review): presumably appends d to ffoutput, which probe() parses
 * afterwards; the body is not visible in this excerpt -- confirm.
 */
534 TranscodeFfmpeg::ffprobeparse (std::string d, size_t /* s */)
/**
 * Progress parser for ffmpeg output during audio extraction.
 *
 * Looks for "time=HH:MM:SS.ff" in the text, converts the timestamp to a
 * frame count using m_fps, clamps it to m_duration and emits
 * Progress(position, m_duration). Text without "time=" is ignored; a
 * timestamp that does not parse results in Progress(0, 0).
 *
 * @param d chunk of text read from ffmpeg; the second (size) parameter
 *          is unnamed and unused
 */
540 TranscodeFfmpeg::ffmpegparse_a (std::string d, size_t /* s */)
543 int h,m,s; char f[7];
544 ARDOUR::framecnt_t p = -1;
546 if (!(t=strstr(d.c_str(), "time="))) { return; }
/* NOTE(review): "%s" writes into the 7-byte buffer f without a field
 * width, so an over-long fractional part would overflow it. */
548 if (sscanf(t+5, "%d:%d:%d.%s",&h,&m,&s,f) == 4) {
/* Timestamp in hundredths of a second; the h/m/s terms of the sum are
 * not visible in this excerpt. It is converted to frames below. */
549 p = (ARDOUR::framecnt_t) floor( 100.0 * (
553 + atoi(f) / pow((double)10, (int)strlen(f))
555 p = p * m_fps / 100.0;
556 if (p > m_duration ) { p = m_duration; }
557 Progress(p, m_duration); /* EMIT SIGNAL */
559 Progress(0, 0); /* EMIT SIGNAL */
/**
 * Progress parser for ffmpeg output during video encoding/transcoding.
 *
 * Text containing "ERROR", "Error" or "error" is forwarded to the warning
 * stream. Text that does not start with "frame=" yields Progress(0, 0);
 * otherwise the number following "frame=" is reported through
 * Progress(frame, m_duration).
 *
 * @param d chunk of text read from ffmpeg; the second (size) parameter
 *          is unnamed and unused
 */
564 TranscodeFfmpeg::ffmpegparse_v (std::string d, size_t /* s */)
566 if (strstr(d.c_str(), "ERROR") || strstr(d.c_str(), "Error") || strstr(d.c_str(), "error")) {
567 warning << "ffmpeg-error: " << d << endmsg;
/* strncmp() returns non-zero when d does NOT begin with "frame=". */
569 if (strncmp(d.c_str(), "frame=",6)) {
/* Strip trailing whitespace before echoing the line; presumably only in
 * debug mode -- the guard is not visible in this excerpt. */
572 d.erase(d.find_last_not_of(" \t\r\n") + 1);
573 printf("ffmpeg: '%s'\n", d.c_str());
576 Progress(0, 0); /* EMIT SIGNAL */
/* Frame counter printed after "frame=". The condition selecting between
 * the two Progress() calls below is not visible in this excerpt. */
579 ARDOUR::framecnt_t f = atol(d.substr(6));
581 Progress(0, 0); /* EMIT SIGNAL */
583 Progress(f, m_duration); /* EMIT SIGNAL */