X-Git-Url: https://git.carlh.net/gitweb/?a=blobdiff_plain;f=src%2Fsubtitle_asset.cc;h=4deb366aa4921cf2bbfdb8c9b2a6f5d8e2287b0d;hb=dfc34502469e9c975bf78011b0efc365c11e9779;hp=9a3e3bbc9929b1302ab1d9ac8a6542a5eb5096a9;hpb=df6ed597b720399f02e7b75a7cf448d0956c89a1;p=libdcp.git diff --git a/src/subtitle_asset.cc b/src/subtitle_asset.cc index 9a3e3bbc..4deb366a 100644 --- a/src/subtitle_asset.cc +++ b/src/subtitle_asset.cc @@ -1,236 +1,919 @@ /* - Copyright (C) 2012 Carl Hetherington + Copyright (C) 2012-2021 Carl Hetherington - This program is free software; you can redistribute it and/or modify + This file is part of libdcp. + + libdcp is free software; you can redistribute it and/or modify it under the terms of the GNU General Public License as published by the Free Software Foundation; either version 2 of the License, or (at your option) any later version. - This program is distributed in the hope that it will be useful, + libdcp is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details. You should have received a copy of the GNU General Public License - along with this program; if not, write to the Free Software - Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA. + along with libdcp. If not, see . + + In addition, as a special exception, the copyright holders give + permission to link the code of portions of this program with the + OpenSSL library under certain conditions as described in each + individual source file, and distribute linked combinations + including the two. + You must obey the GNU General Public License in all respects + for all of the code used other than OpenSSL. If you modify + file(s) with this exception, you may extend this exception to your + version of the file(s), but you are not obligated to do so. If you + do not wish to do so, delete this exception statement from your + version. If you delete this exception statement from all source + files in the program, then also delete it here. */ + +/** @file src/subtitle_asset.cc + * @brief SubtitleAsset class + */ + + +#include "compose.hpp" +#include "dcp_assert.h" +#include "load_font_node.h" +#include "raw_convert.h" +#include "reel_asset.h" #include "subtitle_asset.h" +#include "subtitle_asset_internal.h" +#include "subtitle_image.h" +#include "subtitle_string.h" +#include "util.h" +#include "xml.h" +#include +#include +#include +#include +#include +#include +#include -using namespace std; -using namespace boost; -using namespace libdcp; -SubtitleAsset::SubtitleAsset (string directory, string xml) - : Asset (directory, xml) - , XMLFile (path().string(), "DCSubtitle") +using std::cerr; +using std::cout; +using std::dynamic_pointer_cast; +using std::make_shared; +using std::map; +using std::pair; +using std::shared_ptr; +using std::string; +using std::vector; +using boost::lexical_cast; +using boost::optional; +using namespace dcp; + + +SubtitleAsset::SubtitleAsset () { - _subtitle_id = string_node ("SubtitleID"); - _movie_title = string_node ("MovieTitle"); - _reel_number = int64_node ("ReelNumber"); - _language = string_node ("Language"); - ignore_node ("LoadFont"); +} - list > font_nodes = sub_nodes ("Font"); - _load_font_nodes = sub_nodes ("LoadFont"); - /* Now make Subtitle objects to represent the raw XML nodes - in a sane way. - */ +SubtitleAsset::SubtitleAsset (boost::filesystem::path file) + : Asset (file) +{ + +} + + +string +string_attribute (xmlpp::Element const * node, string name) +{ + auto a = node->get_attribute (name); + if (!a) { + throw XMLError (String::compose ("missing attribute %1", name)); + } + return string (a->get_value ()); +} + + +optional +optional_string_attribute (xmlpp::Element const * node, string name) +{ + auto a = node->get_attribute (name); + if (!a) { + return {}; + } + return string (a->get_value ()); +} + + +optional +optional_bool_attribute (xmlpp::Element const * node, string name) +{ + auto s = optional_string_attribute (node, name); + if (!s) { + return {}; + } + + return (s.get() == "1" || s.get() == "yes"); +} + + +template +optional +optional_number_attribute (xmlpp::Element const * node, string name) +{ + auto s = optional_string_attribute (node, name); + if (!s) { + return boost::optional (); + } + + std::string t = s.get (); + boost::erase_all (t, " "); + return raw_convert (t); +} + - list > current_font_nodes; - for (list >::iterator i = font_nodes.begin(); i != font_nodes.end(); ++i) { - examine_font_node (*i, current_font_nodes); +SubtitleAsset::ParseState +SubtitleAsset::font_node_state (xmlpp::Element const * node, Standard standard) const +{ + ParseState ps; + + if (standard == Standard::INTEROP) { + ps.font_id = optional_string_attribute (node, "Id"); + } else { + ps.font_id = optional_string_attribute (node, "ID"); + } + ps.size = optional_number_attribute (node, "Size"); + ps.aspect_adjust = optional_number_attribute (node, "AspectAdjust"); + ps.italic = optional_bool_attribute (node, "Italic"); + ps.bold = optional_string_attribute(node, "Weight").get_value_or("normal") == "bold"; + if (standard == Standard::INTEROP) { + ps.underline = optional_bool_attribute (node, "Underlined"); + } else { + ps.underline = optional_bool_attribute (node, "Underline"); } + auto c = optional_string_attribute (node, "Color"); + if (c) { + ps.colour = Colour (c.get ()); + } + auto const e = optional_string_attribute (node, "Effect"); + if (e) { + ps.effect = string_to_effect (e.get ()); + } + c = optional_string_attribute (node, "EffectColor"); + if (c) { + ps.effect_colour = Colour (c.get ()); + } + + return ps; } void -SubtitleAsset::examine_font_node (shared_ptr font_node, list >& current_font_nodes) -{ - current_font_nodes.push_back (font_node); - - for (list >::iterator j = font_node->subtitle_nodes.begin(); j != font_node->subtitle_nodes.end(); ++j) { - for (list >::iterator k = (*j)->text_nodes.begin(); k != (*j)->text_nodes.end(); ++k) { - FontNode effective (current_font_nodes); - _subtitles.push_back ( - shared_ptr ( - new Subtitle ( - font_id_to_name (effective.id), - effective.italic.get(), - effective.color.get(), - effective.size, - (*j)->in, - (*j)->out, - (*k)->v_position, - (*k)->v_align, - (*k)->text, - effective.effect.get(), - effective.effect_color.get() - ) - ) - ); - } +SubtitleAsset::position_align (SubtitleAsset::ParseState& ps, xmlpp::Element const * node) const +{ + auto hp = optional_number_attribute (node, "HPosition"); + if (!hp) { + hp = optional_number_attribute (node, "Hposition"); + } + if (hp) { + ps.h_position = hp.get () / 100; } - for (list >::iterator j = font_node->font_nodes.begin(); j != font_node->font_nodes.end(); ++j) { - examine_font_node (*j, current_font_nodes); + auto ha = optional_string_attribute (node, "HAlign"); + if (!ha) { + ha = optional_string_attribute (node, "Halign"); + } + if (ha) { + ps.h_align = string_to_halign (ha.get ()); + } + + auto vp = optional_number_attribute (node, "VPosition"); + if (!vp) { + vp = optional_number_attribute (node, "Vposition"); + } + if (vp) { + ps.v_position = vp.get () / 100; } - current_font_nodes.pop_back (); + auto va = optional_string_attribute (node, "VAlign"); + if (!va) { + va = optional_string_attribute (node, "Valign"); + } + if (va) { + ps.v_align = string_to_valign (va.get ()); + } + + auto zp = optional_number_attribute(node, "Zposition"); + if (zp) { + ps.z_position = zp.get() / 100; + } } -FontNode::FontNode (xmlpp::Node const * node) - : XMLNode (node) + +SubtitleAsset::ParseState +SubtitleAsset::text_node_state (xmlpp::Element const * node) const { - id = optional_string_attribute ("Id"); - size = optional_int64_attribute ("Size"); - italic = optional_bool_attribute ("Italic"); - color = optional_color_attribute ("Color"); - string const e = optional_string_attribute ("Effect"); - if (e == "none") { - effect = NONE; - } else if (e == "border") { - effect = BORDER; - } else if (e == "shadow") { - effect = SHADOW; - } else if (!e.empty ()) { - throw DCPReadError ("unknown subtitle effect type"); + ParseState ps; + + position_align (ps, node); + + auto d = optional_string_attribute (node, "Direction"); + if (d) { + ps.direction = string_to_direction (d.get ()); } - effect_color = optional_color_attribute ("EffectColor"); - subtitle_nodes = sub_nodes ("Subtitle"); - font_nodes = sub_nodes ("Font"); + + ps.type = ParseState::Type::TEXT; + + return ps; } -FontNode::FontNode (list > const & font_nodes) - : size (0) - , italic (false) - , color ("FFFFFFFF") - , effect_color ("FFFFFFFF") + +SubtitleAsset::ParseState +SubtitleAsset::image_node_state (xmlpp::Element const * node) const { - for (list >::const_iterator i = font_nodes.begin(); i != font_nodes.end(); ++i) { - if (!(*i)->id.empty ()) { - id = (*i)->id; + ParseState ps; + + position_align (ps, node); + + ps.type = ParseState::Type::IMAGE; + + return ps; +} + + +SubtitleAsset::ParseState +SubtitleAsset::subtitle_node_state (xmlpp::Element const * node, optional tcr) const +{ + ParseState ps; + ps.in = Time (string_attribute(node, "TimeIn"), tcr); + ps.out = Time (string_attribute(node, "TimeOut"), tcr); + ps.fade_up_time = fade_time (node, "FadeUpTime", tcr); + ps.fade_down_time = fade_time (node, "FadeDownTime", tcr); + return ps; +} + + +Time +SubtitleAsset::fade_time (xmlpp::Element const * node, string name, optional tcr) const +{ + auto const u = optional_string_attribute(node, name).get_value_or (""); + Time t; + + if (u.empty ()) { + t = Time (0, 0, 0, 20, 250); + } else if (u.find (":") != string::npos) { + t = Time (u, tcr); + } else { + t = Time (0, 0, 0, lexical_cast (u), tcr.get_value_or(250)); + } + + if (t > Time (0, 0, 8, 0, 250)) { + t = Time (0, 0, 8, 0, 250); + } + + return t; +} + + +void +SubtitleAsset::parse_subtitles (xmlpp::Element const * node, vector& state, optional tcr, Standard standard) +{ + if (node->get_name() == "Font") { + state.push_back (font_node_state (node, standard)); + } else if (node->get_name() == "Subtitle") { + state.push_back (subtitle_node_state (node, tcr)); + } else if (node->get_name() == "Text") { + state.push_back (text_node_state (node)); + } else if (node->get_name() == "SubtitleList") { + state.push_back (ParseState ()); + } else if (node->get_name() == "Image") { + state.push_back (image_node_state (node)); + } else { + throw XMLError ("unexpected node " + node->get_name()); + } + + float space_before = 0; + + for (auto i: node->get_children()) { + auto const v = dynamic_cast(i); + if (v) { + maybe_add_subtitle (v->get_content(), state, space_before, standard); + space_before = 0; + } + auto const e = dynamic_cast(i); + if (e) { + if (e->get_name() == "Space") { + if (node->get_name() != "Text") { + throw XMLError ("Space node found outside Text"); + } + auto size = optional_string_attribute(e, "Size").get_value_or("0.5"); + if (standard == dcp::Standard::INTEROP) { + boost::replace_all(size, "em", ""); + } + space_before += raw_convert(size); + } else { + parse_subtitles (e, state, tcr, standard); + } + } + } + + state.pop_back (); +} + + +void +SubtitleAsset::maybe_add_subtitle (string text, vector const & parse_state, float space_before, Standard standard) +{ + auto wanted = [](ParseState const& ps) { + return ps.type && (ps.type.get() == ParseState::Type::TEXT || ps.type.get() == ParseState::Type::IMAGE); + }; + + if (find_if(parse_state.begin(), parse_state.end(), wanted) == parse_state.end()) { + return; + } + + ParseState ps; + for (auto const& i: parse_state) { + if (i.font_id) { + ps.font_id = i.font_id.get(); + } + if (i.size) { + ps.size = i.size.get(); + } + if (i.aspect_adjust) { + ps.aspect_adjust = i.aspect_adjust.get(); + } + if (i.italic) { + ps.italic = i.italic.get(); } - if ((*i)->size != 0) { - size = (*i)->size; + if (i.bold) { + ps.bold = i.bold.get(); } - if ((*i)->italic) { - italic = (*i)->italic.get (); + if (i.underline) { + ps.underline = i.underline.get(); } - if ((*i)->color) { - color = (*i)->color.get (); + if (i.colour) { + ps.colour = i.colour.get(); } - if ((*i)->effect) { - effect = (*i)->effect.get (); + if (i.effect) { + ps.effect = i.effect.get(); } - if ((*i)->effect_color) { - effect_color = (*i)->effect_color.get (); + if (i.effect_colour) { + ps.effect_colour = i.effect_colour.get(); } + if (i.h_position) { + ps.h_position = i.h_position.get(); + } + if (i.h_align) { + ps.h_align = i.h_align.get(); + } + if (i.v_position) { + ps.v_position = i.v_position.get(); + } + if (i.v_align) { + ps.v_align = i.v_align.get(); + } + if (i.z_position) { + ps.z_position = i.z_position.get(); + } + if (i.direction) { + ps.direction = i.direction.get(); + } + if (i.in) { + ps.in = i.in.get(); + } + if (i.out) { + ps.out = i.out.get(); + } + if (i.fade_up_time) { + ps.fade_up_time = i.fade_up_time.get(); + } + if (i.fade_down_time) { + ps.fade_down_time = i.fade_down_time.get(); + } + if (i.type) { + ps.type = i.type.get(); + } + } + + if (!ps.in || !ps.out) { + /* We're not in a node; just ignore this content */ + return; + } + + DCP_ASSERT (ps.type); + + switch (ps.type.get()) { + case ParseState::Type::TEXT: + _subtitles.push_back ( + make_shared( + ps.font_id, + ps.italic.get_value_or (false), + ps.bold.get_value_or (false), + ps.underline.get_value_or (false), + ps.colour.get_value_or (dcp::Colour (255, 255, 255)), + ps.size.get_value_or (42), + ps.aspect_adjust.get_value_or (1.0), + ps.in.get(), + ps.out.get(), + ps.h_position.get_value_or(0), + ps.h_align.get_value_or(HAlign::CENTER), + ps.v_position.get_value_or(0), + ps.v_align.get_value_or(VAlign::CENTER), + ps.z_position.get_value_or(0), + ps.direction.get_value_or (Direction::LTR), + text, + ps.effect.get_value_or (Effect::NONE), + ps.effect_colour.get_value_or (dcp::Colour (0, 0, 0)), + ps.fade_up_time.get_value_or(Time()), + ps.fade_down_time.get_value_or(Time()), + space_before + ) + ); + break; + case ParseState::Type::IMAGE: + { + switch (standard) { + case Standard::INTEROP: + if (text.size() >= 4) { + /* Remove file extension */ + text = text.substr(0, text.size() - 4); + } + break; + case Standard::SMPTE: + /* It looks like this urn:uuid: is required, but DoM wasn't expecting it (and not writing it) + * until around 2.15.140 so I guess either: + * a) it is not (always) used in the field, or + * b) nobody noticed / complained. + */ + if (text.substr(0, 9) == "urn:uuid:") { + text = text.substr(9); + } + break; + } + + /* Add a subtitle with no image data and we'll fill that in later */ + _subtitles.push_back ( + make_shared( + ArrayData(), + text, + ps.in.get(), + ps.out.get(), + ps.h_position.get_value_or(0), + ps.h_align.get_value_or(HAlign::CENTER), + ps.v_position.get_value_or(0), + ps.v_align.get_value_or(VAlign::CENTER), + ps.z_position.get_value_or(0), + ps.fade_up_time.get_value_or(Time()), + ps.fade_down_time.get_value_or(Time()) + ) + ); + break; + } } } -LoadFontNode::LoadFontNode (xmlpp::Node const * node) - : XMLNode (node) + +vector> +SubtitleAsset::subtitles () const { - id = string_attribute ("Id"); - uri = string_attribute ("URI"); + vector> s; + for (auto i: _subtitles) { + s.push_back (i); + } + return s; } - -SubtitleNode::SubtitleNode (xmlpp::Node const * node) - : XMLNode (node) + +vector> +SubtitleAsset::subtitles_during (Time from, Time to, bool starting) const { - in = time_attribute ("TimeIn"); - out = time_attribute ("TimeOut"); - text_nodes = sub_nodes ("Text"); + vector> s; + for (auto i: _subtitles) { + if ((starting && from <= i->in() && i->in() < to) || (!starting && i->out() >= from && i->in() <= to)) { + s.push_back (i); + } + } + + return s; } -TextNode::TextNode (xmlpp::Node const * node) - : XMLNode (node) - , v_align (CENTER) + +void +SubtitleAsset::add (shared_ptr s) { - text = content (); - v_position = float_attribute ("VPosition"); - string const v = optional_string_attribute ("VAlign"); - if (v == "top") { - v_align = TOP; - } else if (v == "center") { - v_align = CENTER; - } else if (v == "bottom") { - v_align = BOTTOM; - } + _subtitles.push_back (s); } -list > -SubtitleAsset::subtitles_at (Time t) const + +Time +SubtitleAsset::latest_subtitle_out () const { - list > s; - for (list >::const_iterator i = _subtitles.begin(); i != _subtitles.end(); ++i) { - if ((*i)->in() <= t && t <= (*i)->out ()) { - s.push_back (*i); + Time t; + for (auto i: _subtitles) { + if (i->out() > t) { + t = i->out (); } } - return s; + return t; } -std::string -SubtitleAsset::font_id_to_name (string id) const + +bool +SubtitleAsset::equals(shared_ptr other_asset, EqualityOptions const& options, NoteHandler note) const { - list >::const_iterator i = _load_font_nodes.begin(); - while (i != _load_font_nodes.end() && (*i)->id != id) { - ++i; + if (!Asset::equals (other_asset, options, note)) { + return false; } - if (i == _load_font_nodes.end ()) { - return ""; + auto other = dynamic_pointer_cast (other_asset); + if (!other) { + return false; } - if ((*i)->uri == "arial.ttf") { - return "Arial"; + if (_subtitles.size() != other->_subtitles.size()) { + note (NoteType::ERROR, String::compose("different number of subtitles: %1 vs %2", _subtitles.size(), other->_subtitles.size())); + return false; } - return ""; + auto i = _subtitles.begin(); + auto j = other->_subtitles.begin(); + + while (i != _subtitles.end()) { + auto string_i = dynamic_pointer_cast (*i); + auto string_j = dynamic_pointer_cast (*j); + auto image_i = dynamic_pointer_cast (*i); + auto image_j = dynamic_pointer_cast (*j); + + if ((string_i && !string_j) || (image_i && !image_j)) { + note (NoteType::ERROR, "subtitles differ: string vs. image"); + return false; + } + + if (string_i && !string_i->equals(string_j, options, note)) { + return false; + } + + if (image_i && !image_i->equals(image_j, options, note)) { + return false; + } + + ++i; + ++j; + } + + return true; } -Subtitle::Subtitle ( - string font, - bool italic, - Color color, - int size, - Time in, - Time out, - float v_position, - VAlign v_align, - string text, - Effect effect, - Color effect_color - ) - : _font (font) - , _italic (italic) - , _color (color) - , _size (size) - , _in (in) - , _out (out) - , _v_position (v_position) - , _v_align (v_align) - , _text (text) - , _effect (effect) - , _effect_color (effect_color) + +struct SubtitleSorter { + bool operator() (shared_ptr a, shared_ptr b) { + if (a->in() != b->in()) { + return a->in() < b->in(); + } + if (a->v_align() == VAlign::BOTTOM) { + return a->v_position() > b->v_position(); + } + return a->v_position() < b->v_position(); + } +}; + + +void +SubtitleAsset::pull_fonts (shared_ptr part) +{ + if (part->children.empty ()) { + return; + } + + /* Pull up from children */ + for (auto i: part->children) { + pull_fonts (i); + } + + if (part->parent) { + /* Establish the common font features that each of part's children have; + these features go into part's font. + */ + part->font = part->children.front()->font; + for (auto i: part->children) { + part->font.take_intersection (i->font); + } + + /* Remove common values from part's children's fonts */ + for (auto i: part->children) { + i->font.take_difference (part->font); + } + } + + /* Merge adjacent children with the same font */ + auto i = part->children.begin(); + vector> merged; + + while (i != part->children.end()) { + + if ((*i)->font.empty ()) { + merged.push_back (*i); + ++i; + } else { + auto j = i; + ++j; + while (j != part->children.end() && (*i)->font == (*j)->font) { + ++j; + } + if (std::distance (i, j) == 1) { + merged.push_back (*i); + ++i; + } else { + shared_ptr group (new order::Part (part, (*i)->font)); + for (auto k = i; k != j; ++k) { + (*k)->font.clear (); + group->children.push_back (*k); + } + merged.push_back (group); + i = j; + } + } + } + part->children = merged; } -int -Subtitle::size_in_pixels (int screen_height) const + +/** @param standard Standard (INTEROP or SMPTE); this is used rather than putting things in the child + * class because the differences between the two are fairly subtle. + */ +void +SubtitleAsset::subtitles_as_xml (xmlpp::Element* xml_root, int time_code_rate, Standard standard) const { - /* Size in the subtitle file is given in points as if the screen - height is 11 inches, so a 72pt font would be 1/11th of the screen - height. + auto sorted = _subtitles; + std::stable_sort(sorted.begin(), sorted.end(), SubtitleSorter()); + + /* Gather our subtitles into a hierarchy of Subtitle/Text/String objects, writing + font information into the bottom level (String) objects. */ - - return _size * screen_height / (11 * 72); + + auto root = make_shared(shared_ptr()); + shared_ptr subtitle; + shared_ptr text; + + Time last_in; + Time last_out; + Time last_fade_up_time; + Time last_fade_down_time; + HAlign last_h_align; + float last_h_position; + VAlign last_v_align; + float last_v_position; + float last_z_position; + Direction last_direction; + + for (auto i: sorted) { + if (!subtitle || + (last_in != i->in() || + last_out != i->out() || + last_fade_up_time != i->fade_up_time() || + last_fade_down_time != i->fade_down_time()) + ) { + + subtitle = make_shared(root, i->in(), i->out(), i->fade_up_time(), i->fade_down_time()); + root->children.push_back (subtitle); + + last_in = i->in (); + last_out = i->out (); + last_fade_up_time = i->fade_up_time (); + last_fade_down_time = i->fade_down_time (); + text.reset (); + } + + auto is = dynamic_pointer_cast(i); + if (is) { + if (!text || + last_h_align != is->h_align() || + fabs(last_h_position - is->h_position()) > ALIGN_EPSILON || + last_v_align != is->v_align() || + fabs(last_v_position - is->v_position()) > ALIGN_EPSILON || + fabs(last_z_position - is->z_position()) > ALIGN_EPSILON || + last_direction != is->direction() + ) { + text = make_shared(subtitle, is->h_align(), is->h_position(), is->v_align(), is->v_position(), is->z_position(), is->direction()); + subtitle->children.push_back (text); + + last_h_align = is->h_align (); + last_h_position = is->h_position (); + last_v_align = is->v_align (); + last_v_position = is->v_position (); + last_z_position = is->z_position(); + last_direction = is->direction (); + } + + text->children.push_back (make_shared(text, order::Font (is, standard), is->text(), is->space_before())); + } + + auto ii = dynamic_pointer_cast(i); + if (ii) { + text.reset (); + subtitle->children.push_back ( + make_shared(subtitle, ii->id(), ii->png_image(), ii->h_align(), ii->h_position(), ii->v_align(), ii->v_position(), ii->z_position()) + ); + } + } + + /* Pull font changes as high up the hierarchy as we can */ + + pull_fonts (root); + + /* Write XML */ + + order::Context context; + context.time_code_rate = time_code_rate; + context.standard = standard; + context.spot_number = 1; + + root->write_xml (xml_root, context); +} + + +map +SubtitleAsset::font_data () const +{ + map out; + for (auto const& i: _fonts) { + out[i.load_id] = i.data; + } + return out; } + + +map +SubtitleAsset::font_filenames () const +{ + map out; + for (auto const& i: _fonts) { + if (i.file) { + out[i.load_id] = *i.file; + } + } + return out; +} + + +/** Replace empty IDs in any and tags with + * a dummy string. Some systems give errors with empty font IDs + * (see DCP-o-matic bug #1689). + */ +void +SubtitleAsset::fix_empty_font_ids () +{ + bool have_empty = false; + vector ids; + for (auto i: load_font_nodes()) { + if (i->id == "") { + have_empty = true; + } else { + ids.push_back (i->id); + } + } + + if (!have_empty) { + return; + } + + string const empty_id = unique_string (ids, "font"); + + for (auto i: load_font_nodes()) { + if (i->id == "") { + i->id = empty_id; + } + } + + for (auto i: _subtitles) { + auto j = dynamic_pointer_cast (i); + if (j && j->font() && j->font().get() == "") { + j->set_font (empty_id); + } + } +} + + +namespace { + +struct State +{ + int indent; + string xml; + int disable_formatting; +}; + +} + + +static +void +format_xml_node (xmlpp::Node const* node, State& state) +{ + if (auto text_node = dynamic_cast(node)) { + string content = text_node->get_content(); + boost::replace_all(content, "&", "&"); + boost::replace_all(content, "<", "<"); + boost::replace_all(content, ">", ">"); + state.xml += content; + } else if (auto element = dynamic_cast(node)) { + ++state.indent; + + auto children = element->get_children(); + auto const should_disable_formatting = + std::any_of( + children.begin(), children.end(), + [](xmlpp::Node const* node) { return static_cast(dynamic_cast(node)); } + ) || element->get_name() == "Text"; + + if (!state.disable_formatting) { + state.xml += "\n" + string(state.indent * 2, ' '); + } + + state.xml += "<" + element->get_name(); + + for (auto attribute: element->get_attributes()) { + state.xml += String::compose(" %1=\"%2\"", attribute->get_name().raw(), attribute->get_value().raw()); + } + + if (children.empty()) { + state.xml += "/>"; + } else { + state.xml += ">"; + + if (should_disable_formatting) { + ++state.disable_formatting; + } + + for (auto child: children) { + format_xml_node(child, state); + } + + if (!state.disable_formatting) { + state.xml += "\n" + string(state.indent * 2, ' '); + } + + state.xml += String::compose("", element->get_name().raw()); + + if (should_disable_formatting) { + --state.disable_formatting; + } + } + + --state.indent; + } +} + + +/** Format XML much as write_to_string_formatted() would do, except without adding any white space + * to nodes. This is an attempt to avoid changing what is actually displayed as subtitles + * while also formatting the XML in such a way as to avoid DoM bug 2205. + * + * xml_namespace is an optional namespace for the root node; it would be nicer to set this up with + * set_namespace_declaration in the caller and then to extract it here but I couldn't find a way + * to get all namespaces with the libxml++ API. + */ +string +SubtitleAsset::format_xml(xmlpp::Document const& document, optional> xml_namespace) +{ + auto root = document.get_root_node(); + + State state = {}; + state.xml = "\n<" + root->get_name(); + + if (xml_namespace) { + if (xml_namespace->first.empty()) { + state.xml += String::compose(" xmlns=\"%1\"", xml_namespace->second); + } else { + state.xml += String::compose(" xmlns:%1=\"%2\"", xml_namespace->first, xml_namespace->second); + } + } + + for (auto attribute: root->get_attributes()) { + state.xml += String::compose(" %1=\"%2\"", attribute->get_name().raw(), attribute->get_value().raw()); + } + + state.xml += ">"; + + for (auto child: document.get_root_node()->get_children()) { + format_xml_node(child, state); + } + + state.xml += String::compose("\n\n", root->get_name().raw()); + + return state.xml; +} + + +void +SubtitleAsset::ensure_font(string load_id, dcp::ArrayData data) +{ + if (std::find_if(_fonts.begin(), _fonts.end(), [load_id](Font const& font) { return font.load_id == load_id; }) == _fonts.end()) { + add_font(load_id, data); + } +} +