2 Copyright (C) 2018-2021 Carl Hetherington <cth@carlh.net>
4 This file is part of libdcp.
6 libdcp is free software; you can redistribute it and/or modify
7 it under the terms of the GNU General Public License as published by
8 the Free Software Foundation; either version 2 of the License, or
9 (at your option) any later version.
11 libdcp is distributed in the hope that it will be useful,
12 but WITHOUT ANY WARRANTY; without even the implied warranty of
13 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 GNU General Public License for more details.
16 You should have received a copy of the GNU General Public License
17 along with libdcp. If not, see <http://www.gnu.org/licenses/>.
19 In addition, as a special exception, the copyright holders give
20 permission to link the code of portions of this program with the
21 OpenSSL library under certain conditions as described in each
22 individual source file, and distribute linked combinations
25 You must obey the GNU General Public License in all respects
26 for all of the code used other than OpenSSL. If you modify
27 file(s) with this exception, you may extend this exception to your
28 version of the file(s), but you are not obligated to do so. If you
29 do not wish to do so, delete this exception statement from your
30 version. If you delete this exception statement from all source
31 files in the program, then also delete it here.
35 /** @file src/verify.cc
36 * @brief dcp::verify() method and associated code
40 #include "compose.hpp"
43 #include "exceptions.h"
44 #include "interop_subtitle_asset.h"
45 #include "mono_picture_asset.h"
46 #include "mono_picture_frame.h"
47 #include "raw_convert.h"
49 #include "reel_closed_caption_asset.h"
50 #include "reel_interop_subtitle_asset.h"
51 #include "reel_markers_asset.h"
52 #include "reel_picture_asset.h"
53 #include "reel_sound_asset.h"
54 #include "reel_smpte_subtitle_asset.h"
55 #include "reel_subtitle_asset.h"
56 #include "smpte_subtitle_asset.h"
57 #include "stereo_picture_asset.h"
58 #include "stereo_picture_frame.h"
60 #include "verify_j2k.h"
61 #include <xercesc/dom/DOMAttr.hpp>
62 #include <xercesc/dom/DOMDocument.hpp>
63 #include <xercesc/dom/DOMError.hpp>
64 #include <xercesc/dom/DOMErrorHandler.hpp>
65 #include <xercesc/dom/DOMException.hpp>
66 #include <xercesc/dom/DOMImplementation.hpp>
67 #include <xercesc/dom/DOMImplementationLS.hpp>
68 #include <xercesc/dom/DOMImplementationRegistry.hpp>
69 #include <xercesc/dom/DOMLSParser.hpp>
70 #include <xercesc/dom/DOMLocator.hpp>
71 #include <xercesc/dom/DOMNamedNodeMap.hpp>
72 #include <xercesc/dom/DOMNodeList.hpp>
73 #include <xercesc/framework/LocalFileInputSource.hpp>
74 #include <xercesc/framework/MemBufInputSource.hpp>
75 #include <xercesc/parsers/AbstractDOMParser.hpp>
76 #include <xercesc/parsers/XercesDOMParser.hpp>
77 #include <xercesc/sax/HandlerBase.hpp>
78 #include <xercesc/util/PlatformUtils.hpp>
79 #include <boost/algorithm/string.hpp>
91 using std::shared_ptr;
92 using std::make_shared;
93 using boost::optional;
94 using boost::function;
95 using std::dynamic_pointer_cast;
99 using namespace xercesc;
104 xml_ch_to_string (XMLCh const * a)
106 char* x = XMLString::transcode(a);
108 XMLString::release(&x);
113 class XMLValidationError
116 XMLValidationError (SAXParseException const & e)
117 : _message (xml_ch_to_string(e.getMessage()))
118 , _line (e.getLineNumber())
119 , _column (e.getColumnNumber())
120 , _public_id (e.getPublicId() ? xml_ch_to_string(e.getPublicId()) : "")
121 , _system_id (e.getSystemId() ? xml_ch_to_string(e.getSystemId()) : "")
126 string message () const {
130 uint64_t line () const {
134 uint64_t column () const {
138 string public_id () const {
142 string system_id () const {
155 class DCPErrorHandler : public ErrorHandler
158 void warning(const SAXParseException& e) override
160 maybe_add (XMLValidationError(e));
163 void error(const SAXParseException& e) override
165 maybe_add (XMLValidationError(e));
168 void fatalError(const SAXParseException& e) override
170 maybe_add (XMLValidationError(e));
173 void resetErrors() override {
177 list<XMLValidationError> errors () const {
182 void maybe_add (XMLValidationError e)
184 /* XXX: nasty hack */
186 e.message().find("schema document") != string::npos &&
187 e.message().find("has different target namespace from the one specified in instance document") != string::npos
192 _errors.push_back (e);
195 list<XMLValidationError> _errors;
202 StringToXMLCh (string a)
204 _buffer = XMLString::transcode(a.c_str());
207 StringToXMLCh (StringToXMLCh const&) = delete;
208 StringToXMLCh& operator= (StringToXMLCh const&) = delete;
212 XMLString::release (&_buffer);
215 XMLCh const * get () const {
224 class LocalFileResolver : public EntityResolver
227 LocalFileResolver (boost::filesystem::path xsd_dtd_directory)
228 : _xsd_dtd_directory (xsd_dtd_directory)
230 /* XXX: I'm not clear on what things need to be in this list; some XSDs are apparently, magically
231 * found without being here.
233 add("http://www.w3.org/2001/XMLSchema.dtd", "XMLSchema.dtd");
234 add("http://www.w3.org/2001/03/xml.xsd", "xml.xsd");
235 add("http://www.w3.org/TR/2002/REC-xmldsig-core-20020212/xmldsig-core-schema.xsd", "xmldsig-core-schema.xsd");
236 add("http://www.digicine.com/schemas/437-Y/2007/Main-Stereo-Picture-CPL.xsd", "Main-Stereo-Picture-CPL.xsd");
237 add("http://www.digicine.com/PROTO-ASDCP-CPL-20040511.xsd", "PROTO-ASDCP-CPL-20040511.xsd");
238 add("http://www.digicine.com/PROTO-ASDCP-PKL-20040311.xsd", "PROTO-ASDCP-PKL-20040311.xsd");
239 add("http://www.digicine.com/PROTO-ASDCP-AM-20040311.xsd", "PROTO-ASDCP-AM-20040311.xsd");
240 add("http://www.digicine.com/PROTO-ASDCP-CC-CPL-20070926#", "PROTO-ASDCP-CC-CPL-20070926.xsd");
241 add("interop-subs", "DCSubtitle.v1.mattsson.xsd");
242 add("http://www.smpte-ra.org/schemas/428-7/2010/DCST.xsd", "SMPTE-428-7-2010-DCST.xsd");
243 add("http://www.smpte-ra.org/schemas/429-16/2014/CPL-Metadata", "SMPTE-429-16.xsd");
244 add("http://www.dolby.com/schemas/2012/AD", "Dolby-2012-AD.xsd");
245 add("http://www.smpte-ra.org/schemas/429-10/2008/Main-Stereo-Picture-CPL", "SMPTE-429-10-2008.xsd");
248 InputSource* resolveEntity(XMLCh const *, XMLCh const * system_id) override
253 auto system_id_str = xml_ch_to_string (system_id);
254 auto p = _xsd_dtd_directory;
255 if (_files.find(system_id_str) == _files.end()) {
258 p /= _files[system_id_str];
260 StringToXMLCh ch (p.string());
261 return new LocalFileInputSource(ch.get());
265 void add (string uri, string file)
270 std::map<string, string> _files;
271 boost::filesystem::path _xsd_dtd_directory;
276 parse (XercesDOMParser& parser, boost::filesystem::path xml)
278 parser.parse(xml.string().c_str());
283 parse (XercesDOMParser& parser, string xml)
285 xercesc::MemBufInputSource buf(reinterpret_cast<unsigned char const*>(xml.c_str()), xml.size(), "");
292 validate_xml (T xml, boost::filesystem::path xsd_dtd_directory, vector<VerificationNote>& notes)
295 XMLPlatformUtils::Initialize ();
296 } catch (XMLException& e) {
297 throw MiscError ("Failed to initialise xerces library");
300 DCPErrorHandler error_handler;
302 /* All the xerces objects in this scope must be destroyed before XMLPlatformUtils::Terminate() is called */
304 XercesDOMParser parser;
305 parser.setValidationScheme(XercesDOMParser::Val_Always);
306 parser.setDoNamespaces(true);
307 parser.setDoSchema(true);
309 vector<string> schema;
310 schema.push_back("xml.xsd");
311 schema.push_back("xmldsig-core-schema.xsd");
312 schema.push_back("SMPTE-429-7-2006-CPL.xsd");
313 schema.push_back("SMPTE-429-8-2006-PKL.xsd");
314 schema.push_back("SMPTE-429-9-2007-AM.xsd");
315 schema.push_back("Main-Stereo-Picture-CPL.xsd");
316 schema.push_back("PROTO-ASDCP-CPL-20040511.xsd");
317 schema.push_back("PROTO-ASDCP-PKL-20040311.xsd");
318 schema.push_back("PROTO-ASDCP-AM-20040311.xsd");
319 schema.push_back("DCSubtitle.v1.mattsson.xsd");
320 schema.push_back("DCDMSubtitle-2010.xsd");
321 schema.push_back("PROTO-ASDCP-CC-CPL-20070926.xsd");
322 schema.push_back("SMPTE-429-16.xsd");
323 schema.push_back("Dolby-2012-AD.xsd");
324 schema.push_back("SMPTE-429-10-2008.xsd");
325 schema.push_back("xlink.xsd");
326 schema.push_back("SMPTE-335-2012.xsd");
327 schema.push_back("SMPTE-395-2014-13-1-aaf.xsd");
328 schema.push_back("isdcf-mca.xsd");
329 schema.push_back("SMPTE-429-12-2008.xsd");
331 /* XXX: I'm not especially clear what this is for, but it seems to be necessary.
332 * Schemas that are not mentioned in this list are not read, and the things
333 * they describe are not checked.
336 for (auto i: schema) {
337 locations += String::compose("%1 %1 ", i, i);
340 parser.setExternalSchemaLocation(locations.c_str());
341 parser.setValidationSchemaFullChecking(true);
342 parser.setErrorHandler(&error_handler);
344 LocalFileResolver resolver (xsd_dtd_directory);
345 parser.setEntityResolver(&resolver);
348 parser.resetDocumentPool();
350 } catch (XMLException& e) {
351 throw MiscError(xml_ch_to_string(e.getMessage()));
352 } catch (DOMException& e) {
353 throw MiscError(xml_ch_to_string(e.getMessage()));
355 throw MiscError("Unknown exception from xerces");
359 XMLPlatformUtils::Terminate ();
361 for (auto i: error_handler.errors()) {
363 VerificationNote::Type::ERROR,
364 VerificationNote::Code::INVALID_XML,
366 boost::trim_copy(i.public_id() + " " + i.system_id()),
373 enum class VerifyAssetResult {
380 static VerifyAssetResult
381 verify_asset (shared_ptr<const DCP> dcp, shared_ptr<const ReelFileAsset> reel_file_asset, function<void (float)> progress)
383 auto const actual_hash = reel_file_asset->asset_ref()->hash(progress);
385 auto pkls = dcp->pkls();
386 /* We've read this DCP in so it must have at least one PKL */
387 DCP_ASSERT (!pkls.empty());
389 auto asset = reel_file_asset->asset_ref().asset();
391 optional<string> pkl_hash;
393 pkl_hash = i->hash (reel_file_asset->asset_ref()->id());
399 DCP_ASSERT (pkl_hash);
401 auto cpl_hash = reel_file_asset->hash();
402 if (cpl_hash && *cpl_hash != *pkl_hash) {
403 return VerifyAssetResult::CPL_PKL_DIFFER;
406 if (actual_hash != *pkl_hash) {
407 return VerifyAssetResult::BAD;
410 return VerifyAssetResult::GOOD;
415 verify_language_tag (string tag, vector<VerificationNote>& notes)
418 LanguageTag test (tag);
419 } catch (LanguageTagError &) {
420 notes.push_back ({VerificationNote::Type::BV21_ERROR, VerificationNote::Code::INVALID_LANGUAGE, tag});
426 verify_picture_asset (shared_ptr<const ReelFileAsset> reel_file_asset, boost::filesystem::path file, vector<VerificationNote>& notes, function<void (float)> progress)
428 int biggest_frame = 0;
429 auto asset = dynamic_pointer_cast<PictureAsset>(reel_file_asset->asset_ref().asset());
430 auto const duration = asset->intrinsic_duration ();
432 auto check_and_add = [¬es](vector<VerificationNote> const& j2k_notes) {
433 for (auto i: j2k_notes) {
434 if (find(notes.begin(), notes.end(), i) == notes.end()) {
440 if (auto mono_asset = dynamic_pointer_cast<MonoPictureAsset>(reel_file_asset->asset_ref().asset())) {
441 auto reader = mono_asset->start_read ();
442 for (int64_t i = 0; i < duration; ++i) {
443 auto frame = reader->get_frame (i);
444 biggest_frame = max(biggest_frame, frame->size());
445 if (!mono_asset->encrypted() || mono_asset->key()) {
446 vector<VerificationNote> j2k_notes;
447 verify_j2k (frame, j2k_notes);
448 check_and_add (j2k_notes);
450 progress (float(i) / duration);
452 } else if (auto stereo_asset = dynamic_pointer_cast<StereoPictureAsset>(asset)) {
453 auto reader = stereo_asset->start_read ();
454 for (int64_t i = 0; i < duration; ++i) {
455 auto frame = reader->get_frame (i);
456 biggest_frame = max(biggest_frame, max(frame->left()->size(), frame->right()->size()));
457 if (!stereo_asset->encrypted() || mono_asset->key()) {
458 vector<VerificationNote> j2k_notes;
459 verify_j2k (frame->left(), j2k_notes);
460 verify_j2k (frame->right(), j2k_notes);
461 check_and_add (j2k_notes);
463 progress (float(i) / duration);
468 static const int max_frame = rint(250 * 1000000 / (8 * asset->edit_rate().as_float()));
469 static const int risky_frame = rint(230 * 1000000 / (8 * asset->edit_rate().as_float()));
470 if (biggest_frame > max_frame) {
472 VerificationNote::Type::ERROR, VerificationNote::Code::INVALID_PICTURE_FRAME_SIZE_IN_BYTES, file
474 } else if (biggest_frame > risky_frame) {
476 VerificationNote::Type::WARNING, VerificationNote::Code::NEARLY_INVALID_PICTURE_FRAME_SIZE_IN_BYTES, file
483 verify_main_picture_asset (
484 shared_ptr<const DCP> dcp,
485 shared_ptr<const ReelPictureAsset> reel_asset,
486 function<void (string, optional<boost::filesystem::path>)> stage,
487 function<void (float)> progress,
488 vector<VerificationNote>& notes
491 auto asset = reel_asset->asset();
492 auto const file = *asset->file();
493 stage ("Checking picture asset hash", file);
494 auto const r = verify_asset (dcp, reel_asset, progress);
496 case VerifyAssetResult::BAD:
498 VerificationNote::Type::ERROR, VerificationNote::Code::INCORRECT_PICTURE_HASH, file
501 case VerifyAssetResult::CPL_PKL_DIFFER:
503 VerificationNote::Type::ERROR, VerificationNote::Code::MISMATCHED_PICTURE_HASHES, file
509 stage ("Checking picture frame sizes", asset->file());
510 verify_picture_asset (reel_asset, file, notes, progress);
512 /* Only flat/scope allowed by Bv2.1 */
514 asset->size() != Size(2048, 858) &&
515 asset->size() != Size(1998, 1080) &&
516 asset->size() != Size(4096, 1716) &&
517 asset->size() != Size(3996, 2160)) {
519 VerificationNote::Type::BV21_ERROR,
520 VerificationNote::Code::INVALID_PICTURE_SIZE_IN_PIXELS,
521 String::compose("%1x%2", asset->size().width, asset->size().height),
526 /* Only 24, 25, 48fps allowed for 2K */
528 (asset->size() == Size(2048, 858) || asset->size() == Size(1998, 1080)) &&
529 (asset->edit_rate() != Fraction(24, 1) && asset->edit_rate() != Fraction(25, 1) && asset->edit_rate() != Fraction(48, 1))
532 VerificationNote::Type::BV21_ERROR,
533 VerificationNote::Code::INVALID_PICTURE_FRAME_RATE_FOR_2K,
534 String::compose("%1/%2", asset->edit_rate().numerator, asset->edit_rate().denominator),
539 if (asset->size() == Size(4096, 1716) || asset->size() == Size(3996, 2160)) {
540 /* Only 24fps allowed for 4K */
541 if (asset->edit_rate() != Fraction(24, 1)) {
543 VerificationNote::Type::BV21_ERROR,
544 VerificationNote::Code::INVALID_PICTURE_FRAME_RATE_FOR_4K,
545 String::compose("%1/%2", asset->edit_rate().numerator, asset->edit_rate().denominator),
550 /* Only 2D allowed for 4K */
551 if (dynamic_pointer_cast<const StereoPictureAsset>(asset)) {
553 VerificationNote::Type::BV21_ERROR,
554 VerificationNote::Code::INVALID_PICTURE_ASSET_RESOLUTION_FOR_3D,
555 String::compose("%1/%2", asset->edit_rate().numerator, asset->edit_rate().denominator),
566 verify_main_sound_asset (
567 shared_ptr<const DCP> dcp,
568 shared_ptr<const ReelSoundAsset> reel_asset,
569 function<void (string, optional<boost::filesystem::path>)> stage,
570 function<void (float)> progress,
571 vector<VerificationNote>& notes
574 auto asset = reel_asset->asset();
575 stage ("Checking sound asset hash", asset->file());
576 auto const r = verify_asset (dcp, reel_asset, progress);
578 case VerifyAssetResult::BAD:
579 notes.push_back ({VerificationNote::Type::ERROR, VerificationNote::Code::INCORRECT_SOUND_HASH, *asset->file()});
581 case VerifyAssetResult::CPL_PKL_DIFFER:
582 notes.push_back ({VerificationNote::Type::ERROR, VerificationNote::Code::MISMATCHED_SOUND_HASHES, *asset->file()});
588 stage ("Checking sound asset metadata", asset->file());
590 if (auto lang = asset->language()) {
591 verify_language_tag (*lang, notes);
593 if (asset->sampling_rate() != 48000) {
594 notes.push_back ({VerificationNote::Type::BV21_ERROR, VerificationNote::Code::INVALID_SOUND_FRAME_RATE, raw_convert<string>(asset->sampling_rate()), *asset->file()});
600 verify_main_subtitle_reel (shared_ptr<const ReelSubtitleAsset> reel_asset, vector<VerificationNote>& notes)
602 /* XXX: is Language compulsory? */
603 if (reel_asset->language()) {
604 verify_language_tag (*reel_asset->language(), notes);
607 if (!reel_asset->entry_point()) {
608 notes.push_back ({VerificationNote::Type::BV21_ERROR, VerificationNote::Code::MISSING_SUBTITLE_ENTRY_POINT, reel_asset->id() });
609 } else if (reel_asset->entry_point().get()) {
610 notes.push_back ({VerificationNote::Type::BV21_ERROR, VerificationNote::Code::INCORRECT_SUBTITLE_ENTRY_POINT, reel_asset->id() });
616 verify_closed_caption_reel (shared_ptr<const ReelClosedCaptionAsset> reel_asset, vector<VerificationNote>& notes)
618 /* XXX: is Language compulsory? */
619 if (reel_asset->language()) {
620 verify_language_tag (*reel_asset->language(), notes);
623 if (!reel_asset->entry_point()) {
624 notes.push_back ({VerificationNote::Type::BV21_ERROR, VerificationNote::Code::MISSING_CLOSED_CAPTION_ENTRY_POINT, reel_asset->id() });
625 } else if (reel_asset->entry_point().get()) {
626 notes.push_back ({VerificationNote::Type::BV21_ERROR, VerificationNote::Code::INCORRECT_CLOSED_CAPTION_ENTRY_POINT, reel_asset->id() });
633 boost::optional<string> subtitle_language;
637 /** Verify stuff that is common to both subtitles and closed captions */
639 verify_smpte_timed_text_asset (
640 shared_ptr<const SMPTESubtitleAsset> asset,
641 optional<int64_t> reel_asset_duration,
642 vector<VerificationNote>& notes
645 if (asset->language()) {
646 verify_language_tag (*asset->language(), notes);
648 notes.push_back ({ VerificationNote::Type::BV21_ERROR, VerificationNote::Code::MISSING_SUBTITLE_LANGUAGE, *asset->file() });
651 auto const size = boost::filesystem::file_size(asset->file().get());
652 if (size > 115 * 1024 * 1024) {
654 { VerificationNote::Type::BV21_ERROR, VerificationNote::Code::INVALID_TIMED_TEXT_SIZE_IN_BYTES, raw_convert<string>(size), *asset->file() }
658 /* XXX: I'm not sure what Bv2.1_7.2.1 means when it says "the font resource shall not be larger than 10MB"
659 * but I'm hoping that checking for the total size of all fonts being <= 10MB will do.
661 auto fonts = asset->font_data ();
663 for (auto i: fonts) {
664 total_size += i.second.size();
666 if (total_size > 10 * 1024 * 1024) {
667 notes.push_back ({ VerificationNote::Type::BV21_ERROR, VerificationNote::Code::INVALID_TIMED_TEXT_FONT_SIZE_IN_BYTES, raw_convert<string>(total_size), asset->file().get() });
670 if (!asset->start_time()) {
671 notes.push_back ({ VerificationNote::Type::BV21_ERROR, VerificationNote::Code::MISSING_SUBTITLE_START_TIME, asset->file().get() });
672 } else if (asset->start_time() != Time()) {
673 notes.push_back ({ VerificationNote::Type::BV21_ERROR, VerificationNote::Code::INVALID_SUBTITLE_START_TIME, asset->file().get() });
676 if (reel_asset_duration && *reel_asset_duration != asset->intrinsic_duration()) {
679 VerificationNote::Type::BV21_ERROR,
680 VerificationNote::Code::MISMATCHED_TIMED_TEXT_DURATION,
681 String::compose("%1 %2", *reel_asset_duration, asset->intrinsic_duration()),
688 /** Verify SMPTE subtitle-only stuff */
690 verify_smpte_subtitle_asset (
691 shared_ptr<const SMPTESubtitleAsset> asset,
692 vector<VerificationNote>& notes,
696 if (asset->language()) {
697 if (!state.subtitle_language) {
698 state.subtitle_language = *asset->language();
699 } else if (state.subtitle_language != *asset->language()) {
700 notes.push_back ({ VerificationNote::Type::BV21_ERROR, VerificationNote::Code::MISMATCHED_SUBTITLE_LANGUAGES });
704 DCP_ASSERT (asset->resource_id());
705 auto xml_id = asset->xml_id();
707 if (asset->resource_id().get() != xml_id) {
708 notes.push_back ({ VerificationNote::Type::BV21_ERROR, VerificationNote::Code::MISMATCHED_TIMED_TEXT_RESOURCE_ID });
711 if (asset->id() == asset->resource_id().get() || asset->id() == xml_id) {
712 notes.push_back ({ VerificationNote::Type::BV21_ERROR, VerificationNote::Code::INCORRECT_TIMED_TEXT_ASSET_ID });
715 notes.push_back ({VerificationNote::Type::WARNING, VerificationNote::Code::MISSED_CHECK_OF_ENCRYPTED});
720 /** Verify all subtitle stuff */
722 verify_subtitle_asset (
723 shared_ptr<const SubtitleAsset> asset,
724 optional<int64_t> reel_asset_duration,
725 function<void (string, optional<boost::filesystem::path>)> stage,
726 boost::filesystem::path xsd_dtd_directory,
727 vector<VerificationNote>& notes,
731 stage ("Checking subtitle XML", asset->file());
732 /* Note: we must not use SubtitleAsset::xml_as_string() here as that will mean the data on disk
733 * gets passed through libdcp which may clean up and therefore hide errors.
735 if (asset->raw_xml()) {
736 validate_xml (asset->raw_xml().get(), xsd_dtd_directory, notes);
738 notes.push_back ({VerificationNote::Type::WARNING, VerificationNote::Code::MISSED_CHECK_OF_ENCRYPTED});
741 auto smpte = dynamic_pointer_cast<const SMPTESubtitleAsset>(asset);
743 verify_smpte_timed_text_asset (smpte, reel_asset_duration, notes);
744 verify_smpte_subtitle_asset (smpte, notes, state);
749 /** Verify all closed caption stuff */
751 verify_closed_caption_asset (
752 shared_ptr<const SubtitleAsset> asset,
753 optional<int64_t> reel_asset_duration,
754 function<void (string, optional<boost::filesystem::path>)> stage,
755 boost::filesystem::path xsd_dtd_directory,
756 vector<VerificationNote>& notes
759 stage ("Checking closed caption XML", asset->file());
760 /* Note: we must not use SubtitleAsset::xml_as_string() here as that will mean the data on disk
761 * gets passed through libdcp which may clean up and therefore hide errors.
763 auto raw_xml = asset->raw_xml();
765 validate_xml (*raw_xml, xsd_dtd_directory, notes);
766 if (raw_xml->size() > 256 * 1024) {
767 notes.push_back ({VerificationNote::Type::BV21_ERROR, VerificationNote::Code::INVALID_CLOSED_CAPTION_XML_SIZE_IN_BYTES, raw_convert<string>(raw_xml->size()), *asset->file()});
770 notes.push_back ({VerificationNote::Type::WARNING, VerificationNote::Code::MISSED_CHECK_OF_ENCRYPTED});
773 auto smpte = dynamic_pointer_cast<const SMPTESubtitleAsset>(asset);
775 verify_smpte_timed_text_asset (smpte, reel_asset_duration, notes);
780 /** Check the timing of the individual subtitles and make sure there are no empty <Text> nodes */
783 verify_text_details (
784 vector<shared_ptr<Reel>> reels,
786 vector<VerificationNote>& notes,
787 std::function<bool (shared_ptr<Reel>)> check,
788 std::function<optional<string> (shared_ptr<Reel>)> xml,
789 std::function<int64_t (shared_ptr<Reel>)> duration
792 /* end of last subtitle (in editable units) */
793 optional<int64_t> last_out;
794 auto too_short = false;
795 auto too_close = false;
796 auto too_early = false;
797 auto reel_overlap = false;
798 auto empty_text = false;
799 /* current reel start time (in editable units) */
800 int64_t reel_offset = 0;
802 std::function<void (cxml::ConstNodePtr, optional<int>, optional<Time>, int, bool)> parse;
803 parse = [&parse, &last_out, &too_short, &too_close, &too_early, &empty_text, &reel_offset](cxml::ConstNodePtr node, optional<int> tcr, optional<Time> start_time, int er, bool first_reel) {
804 if (node->name() == "Subtitle") {
805 Time in (node->string_attribute("TimeIn"), tcr);
809 Time out (node->string_attribute("TimeOut"), tcr);
813 if (first_reel && tcr && in < Time(0, 0, 4, 0, *tcr)) {
816 auto length = out - in;
817 if (length.as_editable_units_ceil(er) < 15) {
821 /* XXX: this feels dubious - is it really what Bv2.1 means? */
822 auto distance = reel_offset + in.as_editable_units_ceil(er) - *last_out;
823 if (distance >= 0 && distance < 2) {
827 last_out = reel_offset + out.as_editable_units_floor(er);
828 } else if (node->name() == "Text") {
829 std::function<bool (cxml::ConstNodePtr)> node_has_content = [&](cxml::ConstNodePtr node) {
830 if (!node->content().empty()) {
833 for (auto i: node->node_children()) {
834 if (node_has_content(i)) {
840 if (!node_has_content(node)) {
845 for (auto i: node->node_children()) {
846 parse(i, tcr, start_time, er, first_reel);
850 for (auto i = 0U; i < reels.size(); ++i) {
851 if (!check(reels[i])) {
855 auto reel_xml = xml(reels[i]);
857 notes.push_back ({VerificationNote::Type::WARNING, VerificationNote::Code::MISSED_CHECK_OF_ENCRYPTED});
861 /* We need to look at <Subtitle> instances in the XML being checked, so we can't use the subtitles
862 * read in by libdcp's parser.
865 shared_ptr<cxml::Document> doc;
867 optional<Time> start_time;
869 doc = make_shared<cxml::Document>("SubtitleReel");
870 doc->read_string (*reel_xml);
871 tcr = doc->number_child<int>("TimeCodeRate");
872 auto start_time_string = doc->optional_string_child("StartTime");
873 if (start_time_string) {
874 start_time = Time(*start_time_string, tcr);
877 doc = make_shared<cxml::Document>("DCSubtitle");
878 doc->read_string (*reel_xml);
880 parse (doc, tcr, start_time, edit_rate, i == 0);
881 auto end = reel_offset + duration(reels[i]);
882 if (last_out && *last_out > end) {
888 if (last_out && *last_out > reel_offset) {
894 VerificationNote::Type::WARNING, VerificationNote::Code::INVALID_SUBTITLE_FIRST_TEXT_TIME
900 VerificationNote::Type::WARNING, VerificationNote::Code::INVALID_SUBTITLE_DURATION
906 VerificationNote::Type::WARNING, VerificationNote::Code::INVALID_SUBTITLE_SPACING
912 VerificationNote::Type::ERROR, VerificationNote::Code::SUBTITLE_OVERLAPS_REEL_BOUNDARY
918 VerificationNote::Type::WARNING, VerificationNote::Code::EMPTY_TEXT
926 verify_closed_caption_details (
927 vector<shared_ptr<Reel>> reels,
928 vector<VerificationNote>& notes
931 std::function<void (cxml::ConstNodePtr node, std::vector<cxml::ConstNodePtr>& text_or_image)> find_text_or_image;
932 find_text_or_image = [&find_text_or_image](cxml::ConstNodePtr node, std::vector<cxml::ConstNodePtr>& text_or_image) {
933 for (auto i: node->node_children()) {
934 if (i->name() == "Text") {
935 text_or_image.push_back (i);
937 find_text_or_image (i, text_or_image);
942 auto mismatched_valign = false;
943 auto incorrect_order = false;
945 std::function<void (cxml::ConstNodePtr)> parse;
946 parse = [&parse, &find_text_or_image, &mismatched_valign, &incorrect_order](cxml::ConstNodePtr node) {
947 if (node->name() == "Subtitle") {
948 vector<cxml::ConstNodePtr> text_or_image;
949 find_text_or_image (node, text_or_image);
950 optional<string> last_valign;
951 optional<float> last_vpos;
952 for (auto i: text_or_image) {
953 auto valign = i->optional_string_attribute("VAlign");
955 valign = i->optional_string_attribute("Valign").get_value_or("center");
957 auto vpos = i->optional_number_attribute<float>("VPosition");
959 vpos = i->optional_number_attribute<float>("Vposition").get_value_or(50);
963 if (*last_valign != valign) {
964 mismatched_valign = true;
967 last_valign = valign;
969 if (!mismatched_valign) {
971 if (*last_valign == "top" || *last_valign == "center") {
972 if (*vpos < *last_vpos) {
973 incorrect_order = true;
976 if (*vpos > *last_vpos) {
977 incorrect_order = true;
986 for (auto i: node->node_children()) {
991 for (auto reel: reels) {
992 for (auto ccap: reel->closed_captions()) {
993 auto reel_xml = ccap->asset()->raw_xml();
995 notes.push_back ({VerificationNote::Type::WARNING, VerificationNote::Code::MISSED_CHECK_OF_ENCRYPTED});
999 /* We need to look at <Subtitle> instances in the XML being checked, so we can't use the subtitles
1000 * read in by libdcp's parser.
1003 shared_ptr<cxml::Document> doc;
1005 optional<Time> start_time;
1007 doc = make_shared<cxml::Document>("SubtitleReel");
1008 doc->read_string (*reel_xml);
1010 doc = make_shared<cxml::Document>("DCSubtitle");
1011 doc->read_string (*reel_xml);
1017 if (mismatched_valign) {
1019 VerificationNote::Type::ERROR, VerificationNote::Code::MISMATCHED_CLOSED_CAPTION_VALIGN,
1023 if (incorrect_order) {
1025 VerificationNote::Type::ERROR, VerificationNote::Code::INCORRECT_CLOSED_CAPTION_ORDERING,
1031 struct LinesCharactersResult
1033 bool warning_length_exceeded = false;
1034 bool error_length_exceeded = false;
1035 bool line_count_exceeded = false;
1041 verify_text_lines_and_characters (
1042 shared_ptr<SubtitleAsset> asset,
1045 LinesCharactersResult* result
1051 Event (Time time_, float position_, int characters_)
1053 , position (position_)
1054 , characters (characters_)
1057 Event (Time time_, shared_ptr<Event> start_)
1063 int position; //< position from 0 at top of screen to 100 at bottom
1065 shared_ptr<Event> start;
1068 vector<shared_ptr<Event>> events;
1070 auto position = [](shared_ptr<const SubtitleString> sub) {
1071 switch (sub->v_align()) {
1073 return lrintf(sub->v_position() * 100);
1074 case VAlign::CENTER:
1075 return lrintf((0.5f + sub->v_position()) * 100);
1076 case VAlign::BOTTOM:
1077 return lrintf((1.0f - sub->v_position()) * 100);
1083 for (auto j: asset->subtitles()) {
1084 auto text = dynamic_pointer_cast<const SubtitleString>(j);
1086 auto in = make_shared<Event>(text->in(), position(text), text->text().length());
1087 events.push_back(in);
1088 events.push_back(make_shared<Event>(text->out(), in));
1092 std::sort(events.begin(), events.end(), [](shared_ptr<Event> const& a, shared_ptr<Event>const& b) {
1093 return a->time < b->time;
1096 map<int, int> current;
1097 for (auto i: events) {
1098 if (current.size() > 3) {
1099 result->line_count_exceeded = true;
1101 for (auto j: current) {
1102 if (j.second > warning_length) {
1103 result->warning_length_exceeded = true;
1105 if (j.second > error_length) {
1106 result->error_length_exceeded = true;
1111 /* end of a subtitle */
1112 DCP_ASSERT (current.find(i->start->position) != current.end());
1113 if (current[i->start->position] == i->start->characters) {
1114 current.erase(i->start->position);
1116 current[i->start->position] -= i->start->characters;
1119 /* start of a subtitle */
1120 if (current.find(i->position) == current.end()) {
1121 current[i->position] = i->characters;
1123 current[i->position] += i->characters;
1132 verify_text_details (vector<shared_ptr<Reel>> reels, vector<VerificationNote>& notes)
1134 if (reels.empty()) {
1138 if (reels[0]->main_subtitle()) {
1139 verify_text_details (reels, reels[0]->main_subtitle()->edit_rate().numerator, notes,
1140 [](shared_ptr<Reel> reel) {
1141 return static_cast<bool>(reel->main_subtitle());
1143 [](shared_ptr<Reel> reel) {
1144 auto interop = dynamic_pointer_cast<ReelInteropSubtitleAsset>(reel->main_subtitle());
1146 return interop->asset()->raw_xml();
1148 auto smpte = dynamic_pointer_cast<ReelSMPTESubtitleAsset>(reel->main_subtitle());
1150 return smpte->asset()->raw_xml();
1152 [](shared_ptr<Reel> reel) {
1153 return reel->main_subtitle()->actual_duration();
1158 for (auto i = 0U; i < reels[0]->closed_captions().size(); ++i) {
1159 verify_text_details (reels, reels[0]->closed_captions()[i]->edit_rate().numerator, notes,
1160 [i](shared_ptr<Reel> reel) {
1161 return i < reel->closed_captions().size();
1163 [i](shared_ptr<Reel> reel) {
1164 return reel->closed_captions()[i]->asset()->raw_xml();
1166 [i](shared_ptr<Reel> reel) {
1167 return reel->closed_captions()[i]->actual_duration();
1172 verify_closed_caption_details (reels, notes);
1177 verify_extension_metadata (shared_ptr<CPL> cpl, vector<VerificationNote>& notes)
1179 DCP_ASSERT (cpl->file());
1180 cxml::Document doc ("CompositionPlaylist");
1181 doc.read_file (cpl->file().get());
1183 auto missing = false;
1186 if (auto reel_list = doc.node_child("ReelList")) {
1187 auto reels = reel_list->node_children("Reel");
1188 if (!reels.empty()) {
1189 if (auto asset_list = reels[0]->optional_node_child("AssetList")) {
1190 if (auto metadata = asset_list->optional_node_child("CompositionMetadataAsset")) {
1191 if (auto extension_list = metadata->optional_node_child("ExtensionMetadataList")) {
1193 for (auto extension: extension_list->node_children("ExtensionMetadata")) {
1194 if (extension->optional_string_attribute("scope").get_value_or("") != "http://isdcf.com/ns/cplmd/app") {
1198 if (auto name = extension->optional_node_child("Name")) {
1199 if (name->content() != "Application") {
1200 malformed = "<Name> should be 'Application'";
1203 if (auto property_list = extension->optional_node_child("PropertyList")) {
1204 if (auto property = property_list->optional_node_child("Property")) {
1205 if (auto name = property->optional_node_child("Name")) {
1206 if (name->content() != "DCP Constraints Profile") {
1207 malformed = "<Name> property should be 'DCP Constraints Profile'";
1210 if (auto value = property->optional_node_child("Value")) {
1211 if (value->content() != "SMPTE-RDD-52:2020-Bv2.1") {
1212 malformed = "<Value> property should be 'SMPTE-RDD-52:2020-Bv2.1'";
1227 notes.push_back ({VerificationNote::Type::BV21_ERROR, VerificationNote::Code::MISSING_EXTENSION_METADATA, cpl->id(), cpl->file().get()});
1228 } else if (!malformed.empty()) {
1229 notes.push_back ({VerificationNote::Type::BV21_ERROR, VerificationNote::Code::INVALID_EXTENSION_METADATA, malformed, cpl->file().get()});
1235 pkl_has_encrypted_assets (shared_ptr<DCP> dcp, shared_ptr<PKL> pkl)
1237 vector<string> encrypted;
1238 for (auto i: dcp->cpls()) {
1239 for (auto j: i->reel_file_assets()) {
1240 if (j->asset_ref().resolved()) {
1241 auto mxf = dynamic_pointer_cast<MXF>(j->asset_ref().asset());
1242 if (mxf && mxf->encrypted()) {
1243 encrypted.push_back(j->asset_ref().id());
1249 for (auto i: pkl->asset_list()) {
1250 if (find(encrypted.begin(), encrypted.end(), i->id()) != encrypted.end()) {
1259 vector<VerificationNote>
1261 vector<boost::filesystem::path> directories,
1262 function<void (string, optional<boost::filesystem::path>)> stage,
1263 function<void (float)> progress,
1264 optional<boost::filesystem::path> xsd_dtd_directory
1267 if (!xsd_dtd_directory) {
1268 xsd_dtd_directory = resources_directory() / "xsd";
1270 *xsd_dtd_directory = boost::filesystem::canonical (*xsd_dtd_directory);
1272 vector<VerificationNote> notes;
1275 vector<shared_ptr<DCP>> dcps;
1276 for (auto i: directories) {
1277 dcps.push_back (make_shared<DCP>(i));
1280 for (auto dcp: dcps) {
1281 stage ("Checking DCP", dcp->directory());
1282 bool carry_on = true;
1284 dcp->read (¬es, true);
1285 } catch (MissingAssetmapError& e) {
1286 notes.push_back ({VerificationNote::Type::ERROR, VerificationNote::Code::FAILED_READ, string(e.what())});
1288 } catch (ReadError& e) {
1289 notes.push_back ({VerificationNote::Type::ERROR, VerificationNote::Code::FAILED_READ, string(e.what())});
1290 } catch (XMLError& e) {
1291 notes.push_back ({VerificationNote::Type::ERROR, VerificationNote::Code::FAILED_READ, string(e.what())});
1292 } catch (MXFFileError& e) {
1293 notes.push_back ({VerificationNote::Type::ERROR, VerificationNote::Code::FAILED_READ, string(e.what())});
1294 } catch (cxml::Error& e) {
1295 notes.push_back ({VerificationNote::Type::ERROR, VerificationNote::Code::FAILED_READ, string(e.what())});
1302 if (dcp->standard() != Standard::SMPTE) {
1303 notes.push_back ({VerificationNote::Type::BV21_ERROR, VerificationNote::Code::INVALID_STANDARD});
1306 for (auto cpl: dcp->cpls()) {
1307 stage ("Checking CPL", cpl->file());
1308 validate_xml (cpl->file().get(), *xsd_dtd_directory, notes);
1310 if (cpl->any_encrypted() && !cpl->all_encrypted()) {
1311 notes.push_back ({VerificationNote::Type::BV21_ERROR, VerificationNote::Code::PARTIALLY_ENCRYPTED});
1314 for (auto const& i: cpl->additional_subtitle_languages()) {
1315 verify_language_tag (i, notes);
1318 if (cpl->release_territory()) {
1319 if (!cpl->release_territory_scope() || cpl->release_territory_scope().get() != "http://www.smpte-ra.org/schemas/429-16/2014/CPL-Metadata#scope/release-territory/UNM49") {
1320 auto terr = cpl->release_territory().get();
1321 /* Must be a valid region tag, or "001" */
1323 LanguageTag::RegionSubtag test (terr);
1325 if (terr != "001") {
1326 notes.push_back ({VerificationNote::Type::BV21_ERROR, VerificationNote::Code::INVALID_LANGUAGE, terr});
1332 if (dcp->standard() == Standard::SMPTE) {
1333 if (!cpl->annotation_text()) {
1334 notes.push_back ({VerificationNote::Type::BV21_ERROR, VerificationNote::Code::MISSING_CPL_ANNOTATION_TEXT, cpl->id(), cpl->file().get()});
1335 } else if (cpl->annotation_text().get() != cpl->content_title_text()) {
1336 notes.push_back ({VerificationNote::Type::WARNING, VerificationNote::Code::MISMATCHED_CPL_ANNOTATION_TEXT, cpl->id(), cpl->file().get()});
1340 for (auto i: dcp->pkls()) {
1341 /* Check that the CPL's hash corresponds to the PKL */
1342 optional<string> h = i->hash(cpl->id());
1343 if (h && make_digest(ArrayData(*cpl->file())) != *h) {
1344 notes.push_back ({VerificationNote::Type::ERROR, VerificationNote::Code::MISMATCHED_CPL_HASHES, cpl->id(), cpl->file().get()});
1347 /* Check that any PKL with a single CPL has its AnnotationText the same as the CPL's ContentTitleText */
1348 optional<string> required_annotation_text;
1349 for (auto j: i->asset_list()) {
1350 /* See if this is a CPL */
1351 for (auto k: dcp->cpls()) {
1352 if (j->id() == k->id()) {
1353 if (!required_annotation_text) {
1354 /* First CPL we have found; this is the required AnnotationText unless we find another */
1355 required_annotation_text = cpl->content_title_text();
1357 /* There's more than one CPL so we don't care what the PKL's AnnotationText is */
1358 required_annotation_text = boost::none;
1364 if (required_annotation_text && i->annotation_text() != required_annotation_text) {
1365 notes.push_back ({VerificationNote::Type::BV21_ERROR, VerificationNote::Code::MISMATCHED_PKL_ANNOTATION_TEXT_WITH_CPL, i->id(), i->file().get()});
1369 /* set to true if any reel has a MainSubtitle */
1370 auto have_main_subtitle = false;
1371 /* set to true if any reel has no MainSubtitle */
1372 auto have_no_main_subtitle = false;
1373 /* fewest number of closed caption assets seen in a reel */
1374 size_t fewest_closed_captions = SIZE_MAX;
1375 /* most number of closed caption assets seen in a reel */
1376 size_t most_closed_captions = 0;
1377 map<Marker, Time> markers_seen;
1379 for (auto reel: cpl->reels()) {
1380 stage ("Checking reel", optional<boost::filesystem::path>());
1382 for (auto i: reel->assets()) {
1383 if (i->duration() && (i->duration().get() * i->edit_rate().denominator / i->edit_rate().numerator) < 1) {
1384 notes.push_back ({VerificationNote::Type::ERROR, VerificationNote::Code::INVALID_DURATION, i->id()});
1386 if ((i->intrinsic_duration() * i->edit_rate().denominator / i->edit_rate().numerator) < 1) {
1387 notes.push_back ({VerificationNote::Type::ERROR, VerificationNote::Code::INVALID_INTRINSIC_DURATION, i->id()});
1389 auto file_asset = dynamic_pointer_cast<ReelFileAsset>(i);
1390 if (i->encryptable() && !file_asset->hash()) {
1391 notes.push_back ({VerificationNote::Type::BV21_ERROR, VerificationNote::Code::MISSING_HASH, i->id()});
1395 if (dcp->standard() == Standard::SMPTE) {
1396 boost::optional<int64_t> duration;
1397 for (auto i: reel->assets()) {
1399 duration = i->actual_duration();
1400 } else if (*duration != i->actual_duration()) {
1401 notes.push_back ({VerificationNote::Type::BV21_ERROR, VerificationNote::Code::MISMATCHED_ASSET_DURATION});
1407 if (reel->main_picture()) {
1408 /* Check reel stuff */
1409 auto const frame_rate = reel->main_picture()->frame_rate();
1410 if (frame_rate.denominator != 1 ||
1411 (frame_rate.numerator != 24 &&
1412 frame_rate.numerator != 25 &&
1413 frame_rate.numerator != 30 &&
1414 frame_rate.numerator != 48 &&
1415 frame_rate.numerator != 50 &&
1416 frame_rate.numerator != 60 &&
1417 frame_rate.numerator != 96)) {
1419 VerificationNote::Type::ERROR,
1420 VerificationNote::Code::INVALID_PICTURE_FRAME_RATE,
1421 String::compose("%1/%2", frame_rate.numerator, frame_rate.denominator)
1425 if (reel->main_picture()->asset_ref().resolved()) {
1426 verify_main_picture_asset (dcp, reel->main_picture(), stage, progress, notes);
1430 if (reel->main_sound() && reel->main_sound()->asset_ref().resolved()) {
1431 verify_main_sound_asset (dcp, reel->main_sound(), stage, progress, notes);
1434 if (reel->main_subtitle()) {
1435 verify_main_subtitle_reel (reel->main_subtitle(), notes);
1436 if (reel->main_subtitle()->asset_ref().resolved()) {
1437 verify_subtitle_asset (reel->main_subtitle()->asset(), reel->main_subtitle()->duration(), stage, *xsd_dtd_directory, notes, state);
1439 have_main_subtitle = true;
1441 have_no_main_subtitle = true;
1444 for (auto i: reel->closed_captions()) {
1445 verify_closed_caption_reel (i, notes);
1446 if (i->asset_ref().resolved()) {
1447 verify_closed_caption_asset (i->asset(), i->duration(), stage, *xsd_dtd_directory, notes);
1451 if (reel->main_markers()) {
1452 for (auto const& i: reel->main_markers()->get()) {
1453 markers_seen.insert (i);
1455 if (reel->main_markers()->entry_point()) {
1456 notes.push_back ({VerificationNote::Type::ERROR, VerificationNote::Code::UNEXPECTED_ENTRY_POINT});
1458 if (reel->main_markers()->duration()) {
1459 notes.push_back ({VerificationNote::Type::ERROR, VerificationNote::Code::UNEXPECTED_DURATION});
1463 fewest_closed_captions = std::min (fewest_closed_captions, reel->closed_captions().size());
1464 most_closed_captions = std::max (most_closed_captions, reel->closed_captions().size());
1467 verify_text_details (cpl->reels(), notes);
1469 if (dcp->standard() == Standard::SMPTE) {
1471 if (have_main_subtitle && have_no_main_subtitle) {
1472 notes.push_back ({VerificationNote::Type::BV21_ERROR, VerificationNote::Code::MISSING_MAIN_SUBTITLE_FROM_SOME_REELS});
1475 if (fewest_closed_captions != most_closed_captions) {
1476 notes.push_back ({VerificationNote::Type::BV21_ERROR, VerificationNote::Code::MISMATCHED_CLOSED_CAPTION_ASSET_COUNTS});
1479 if (cpl->content_kind() == ContentKind::FEATURE) {
1480 if (markers_seen.find(Marker::FFEC) == markers_seen.end()) {
1481 notes.push_back ({VerificationNote::Type::BV21_ERROR, VerificationNote::Code::MISSING_FFEC_IN_FEATURE});
1483 if (markers_seen.find(Marker::FFMC) == markers_seen.end()) {
1484 notes.push_back ({VerificationNote::Type::BV21_ERROR, VerificationNote::Code::MISSING_FFMC_IN_FEATURE});
1488 auto ffoc = markers_seen.find(Marker::FFOC);
1489 if (ffoc == markers_seen.end()) {
1490 notes.push_back ({VerificationNote::Type::WARNING, VerificationNote::Code::MISSING_FFOC});
1491 } else if (ffoc->second.e != 1) {
1492 notes.push_back ({VerificationNote::Type::WARNING, VerificationNote::Code::INCORRECT_FFOC, raw_convert<string>(ffoc->second.e)});
1495 auto lfoc = markers_seen.find(Marker::LFOC);
1496 if (lfoc == markers_seen.end()) {
1497 notes.push_back ({VerificationNote::Type::WARNING, VerificationNote::Code::MISSING_LFOC});
1499 auto lfoc_time = lfoc->second.as_editable_units_ceil(lfoc->second.tcr);
1500 if (lfoc_time != (cpl->reels().back()->duration() - 1)) {
1501 notes.push_back ({VerificationNote::Type::WARNING, VerificationNote::Code::INCORRECT_LFOC, raw_convert<string>(lfoc_time)});
1505 LinesCharactersResult result;
1506 for (auto reel: cpl->reels()) {
1507 if (reel->main_subtitle() && reel->main_subtitle()->asset()) {
1508 verify_text_lines_and_characters (reel->main_subtitle()->asset(), 52, 79, &result);
1512 if (result.line_count_exceeded) {
1513 notes.push_back ({VerificationNote::Type::WARNING, VerificationNote::Code::INVALID_SUBTITLE_LINE_COUNT});
1515 if (result.error_length_exceeded) {
1516 notes.push_back ({VerificationNote::Type::WARNING, VerificationNote::Code::INVALID_SUBTITLE_LINE_LENGTH});
1517 } else if (result.warning_length_exceeded) {
1518 notes.push_back ({VerificationNote::Type::WARNING, VerificationNote::Code::NEARLY_INVALID_SUBTITLE_LINE_LENGTH});
1521 result = LinesCharactersResult();
1522 for (auto reel: cpl->reels()) {
1523 for (auto i: reel->closed_captions()) {
1525 verify_text_lines_and_characters (i->asset(), 32, 32, &result);
1530 if (result.line_count_exceeded) {
1531 notes.push_back ({VerificationNote::Type::BV21_ERROR, VerificationNote::Code::INVALID_CLOSED_CAPTION_LINE_COUNT});
1533 if (result.error_length_exceeded) {
1534 notes.push_back ({VerificationNote::Type::BV21_ERROR, VerificationNote::Code::INVALID_CLOSED_CAPTION_LINE_LENGTH});
1537 if (!cpl->full_content_title_text()) {
1538 /* Since FullContentTitleText is assumed always to exist if there's a CompositionMetadataAsset we
1539 * can use it as a proxy for CompositionMetadataAsset's existence.
1541 notes.push_back ({VerificationNote::Type::BV21_ERROR, VerificationNote::Code::MISSING_CPL_METADATA, cpl->id(), cpl->file().get()});
1542 } else if (!cpl->version_number()) {
1543 notes.push_back ({VerificationNote::Type::BV21_ERROR, VerificationNote::Code::MISSING_CPL_METADATA_VERSION_NUMBER, cpl->id(), cpl->file().get()});
1546 verify_extension_metadata (cpl, notes);
1548 if (cpl->any_encrypted()) {
1549 cxml::Document doc ("CompositionPlaylist");
1550 DCP_ASSERT (cpl->file());
1551 doc.read_file (cpl->file().get());
1552 if (!doc.optional_node_child("Signature")) {
1553 notes.push_back ({VerificationNote::Type::BV21_ERROR, VerificationNote::Code::UNSIGNED_CPL_WITH_ENCRYPTED_CONTENT, cpl->id(), cpl->file().get()});
1559 for (auto pkl: dcp->pkls()) {
1560 stage ("Checking PKL", pkl->file());
1561 validate_xml (pkl->file().get(), *xsd_dtd_directory, notes);
1562 if (pkl_has_encrypted_assets(dcp, pkl)) {
1563 cxml::Document doc ("PackingList");
1564 doc.read_file (pkl->file().get());
1565 if (!doc.optional_node_child("Signature")) {
1566 notes.push_back ({VerificationNote::Type::BV21_ERROR, VerificationNote::Code::UNSIGNED_PKL_WITH_ENCRYPTED_CONTENT, pkl->id(), pkl->file().get()});
1571 if (dcp->asset_map_path()) {
1572 stage ("Checking ASSETMAP", dcp->asset_map_path().get());
1573 validate_xml (dcp->asset_map_path().get(), *xsd_dtd_directory, notes);
1575 notes.push_back ({VerificationNote::Type::ERROR, VerificationNote::Code::MISSING_ASSETMAP});
1584 dcp::note_to_string (VerificationNote note)
1586 /** These strings should say what is wrong, incorporating any extra details (ID, filenames etc.).
1588 * e.g. "ClosedCaption asset has no <EntryPoint> tag.",
1589 * not "ClosedCaption assets must have an <EntryPoint> tag."
1591 * It's OK to use XML tag names where they are clear.
1592 * If both ID and filename are available, use only the ID.
1593 * End messages with a full stop.
1594 * Messages should not mention whether or not their errors are a part of Bv2.1.
1596 switch (note.code()) {
1597 case VerificationNote::Code::FAILED_READ:
1598 return *note.note();
1599 case VerificationNote::Code::MISMATCHED_CPL_HASHES:
1600 return String::compose("The hash of the CPL %1 in the PKL does not agree with the CPL file.", note.note().get());
1601 case VerificationNote::Code::INVALID_PICTURE_FRAME_RATE:
1602 return String::compose("The picture in a reel has an invalid frame rate %1.", note.note().get());
1603 case VerificationNote::Code::INCORRECT_PICTURE_HASH:
1604 return String::compose("The hash of the picture asset %1 does not agree with the PKL file.", note.file()->filename());
1605 case VerificationNote::Code::MISMATCHED_PICTURE_HASHES:
1606 return String::compose("The PKL and CPL hashes differ for the picture asset %1.", note.file()->filename());
1607 case VerificationNote::Code::INCORRECT_SOUND_HASH:
1608 return String::compose("The hash of the sound asset %1 does not agree with the PKL file.", note.file()->filename());
1609 case VerificationNote::Code::MISMATCHED_SOUND_HASHES:
1610 return String::compose("The PKL and CPL hashes differ for the sound asset %1.", note.file()->filename());
1611 case VerificationNote::Code::EMPTY_ASSET_PATH:
1612 return "The asset map contains an empty asset path.";
1613 case VerificationNote::Code::MISSING_ASSET:
1614 return String::compose("The file %1 for an asset in the asset map cannot be found.", note.file()->filename());
1615 case VerificationNote::Code::MISMATCHED_STANDARD:
1616 return "The DCP contains both SMPTE and Interop parts.";
1617 case VerificationNote::Code::INVALID_XML:
1618 return String::compose("An XML file is badly formed: %1 (%2:%3)", note.note().get(), note.file()->filename(), note.line().get());
1619 case VerificationNote::Code::MISSING_ASSETMAP:
1620 return "No ASSETMAP or ASSETMAP.xml was found.";
1621 case VerificationNote::Code::INVALID_INTRINSIC_DURATION:
1622 return String::compose("The intrinsic duration of the asset %1 is less than 1 second.", note.note().get());
1623 case VerificationNote::Code::INVALID_DURATION:
1624 return String::compose("The duration of the asset %1 is less than 1 second.", note.note().get());
1625 case VerificationNote::Code::INVALID_PICTURE_FRAME_SIZE_IN_BYTES:
1626 return String::compose("The instantaneous bit rate of the picture asset %1 is larger than the limit of 250Mbit/s in at least one place.", note.file()->filename());
1627 case VerificationNote::Code::NEARLY_INVALID_PICTURE_FRAME_SIZE_IN_BYTES:
1628 return String::compose("The instantaneous bit rate of the picture asset %1 is close to the limit of 250Mbit/s in at least one place.", note.file()->filename());
1629 case VerificationNote::Code::EXTERNAL_ASSET:
1630 return String::compose("The asset %1 that this DCP refers to is not included in the DCP. It may be a VF.", note.note().get());
1631 case VerificationNote::Code::THREED_ASSET_MARKED_AS_TWOD:
1632 return String::compose("The asset %1 is 3D but its MXF is marked as 2D.", note.file()->filename());
1633 case VerificationNote::Code::INVALID_STANDARD:
1634 return "This DCP does not use the SMPTE standard.";
1635 case VerificationNote::Code::INVALID_LANGUAGE:
1636 return String::compose("The DCP specifies a language '%1' which does not conform to the RFC 5646 standard.", note.note().get());
1637 case VerificationNote::Code::INVALID_PICTURE_SIZE_IN_PIXELS:
1638 return String::compose("The size %1 of picture asset %2 is not allowed.", note.note().get(), note.file()->filename());
1639 case VerificationNote::Code::INVALID_PICTURE_FRAME_RATE_FOR_2K:
1640 return String::compose("The frame rate %1 of picture asset %2 is not allowed for 2K DCPs.", note.note().get(), note.file()->filename());
1641 case VerificationNote::Code::INVALID_PICTURE_FRAME_RATE_FOR_4K:
1642 return String::compose("The frame rate %1 of picture asset %2 is not allowed for 4K DCPs.", note.note().get(), note.file()->filename());
1643 case VerificationNote::Code::INVALID_PICTURE_ASSET_RESOLUTION_FOR_3D:
1644 return "3D 4K DCPs are not allowed.";
1645 case VerificationNote::Code::INVALID_CLOSED_CAPTION_XML_SIZE_IN_BYTES:
1646 return String::compose("The size %1 of the closed caption asset %2 is larger than the 256KB maximum.", note.note().get(), note.file()->filename());
1647 case VerificationNote::Code::INVALID_TIMED_TEXT_SIZE_IN_BYTES:
1648 return String::compose("The size %1 of the timed text asset %2 is larger than the 115MB maximum.", note.note().get(), note.file()->filename());
1649 case VerificationNote::Code::INVALID_TIMED_TEXT_FONT_SIZE_IN_BYTES:
1650 return String::compose("The size %1 of the fonts in timed text asset %2 is larger than the 10MB maximum.", note.note().get(), note.file()->filename());
1651 case VerificationNote::Code::MISSING_SUBTITLE_LANGUAGE:
1652 return String::compose("The XML for the SMPTE subtitle asset %1 has no <Language> tag.", note.file()->filename());
1653 case VerificationNote::Code::MISMATCHED_SUBTITLE_LANGUAGES:
1654 return "Some subtitle assets have different <Language> tags than others";
1655 case VerificationNote::Code::MISSING_SUBTITLE_START_TIME:
1656 return String::compose("The XML for the SMPTE subtitle asset %1 has no <StartTime> tag.", note.file()->filename());
1657 case VerificationNote::Code::INVALID_SUBTITLE_START_TIME:
1658 return String::compose("The XML for a SMPTE subtitle asset %1 has a non-zero <StartTime> tag.", note.file()->filename());
1659 case VerificationNote::Code::INVALID_SUBTITLE_FIRST_TEXT_TIME:
1660 return "The first subtitle or closed caption is less than 4 seconds from the start of the DCP.";
1661 case VerificationNote::Code::INVALID_SUBTITLE_DURATION:
1662 return "At least one subtitle lasts less than 15 frames.";
1663 case VerificationNote::Code::INVALID_SUBTITLE_SPACING:
1664 return "At least one pair of subtitles is separated by less than 2 frames.";
1665 case VerificationNote::Code::SUBTITLE_OVERLAPS_REEL_BOUNDARY:
1666 return "At least one subtitle extends outside of its reel.";
1667 case VerificationNote::Code::INVALID_SUBTITLE_LINE_COUNT:
1668 return "There are more than 3 subtitle lines in at least one place in the DCP.";
1669 case VerificationNote::Code::NEARLY_INVALID_SUBTITLE_LINE_LENGTH:
1670 return "There are more than 52 characters in at least one subtitle line.";
1671 case VerificationNote::Code::INVALID_SUBTITLE_LINE_LENGTH:
1672 return "There are more than 79 characters in at least one subtitle line.";
1673 case VerificationNote::Code::INVALID_CLOSED_CAPTION_LINE_COUNT:
1674 return "There are more than 3 closed caption lines in at least one place.";
1675 case VerificationNote::Code::INVALID_CLOSED_CAPTION_LINE_LENGTH:
1676 return "There are more than 32 characters in at least one closed caption line.";
1677 case VerificationNote::Code::INVALID_SOUND_FRAME_RATE:
1678 return String::compose("The sound asset %1 has a sampling rate of %2", note.file()->filename(), note.note().get());
1679 case VerificationNote::Code::MISSING_CPL_ANNOTATION_TEXT:
1680 return String::compose("The CPL %1 has no <AnnotationText> tag.", note.note().get());
1681 case VerificationNote::Code::MISMATCHED_CPL_ANNOTATION_TEXT:
1682 return String::compose("The CPL %1 has an <AnnotationText> which differs from its <ContentTitleText>", note.note().get());
1683 case VerificationNote::Code::MISMATCHED_ASSET_DURATION:
1684 return "All assets in a reel do not have the same duration.";
1685 case VerificationNote::Code::MISSING_MAIN_SUBTITLE_FROM_SOME_REELS:
1686 return "At least one reel contains a subtitle asset, but some reel(s) do not";
1687 case VerificationNote::Code::MISMATCHED_CLOSED_CAPTION_ASSET_COUNTS:
1688 return "At least one reel has closed captions, but reels have different numbers of closed caption assets.";
1689 case VerificationNote::Code::MISSING_SUBTITLE_ENTRY_POINT:
1690 return String::compose("The subtitle asset %1 has no <EntryPoint> tag.", note.note().get());
1691 case VerificationNote::Code::INCORRECT_SUBTITLE_ENTRY_POINT:
1692 return String::compose("The subtitle asset %1 has an <EntryPoint> other than 0.", note.note().get());
1693 case VerificationNote::Code::MISSING_CLOSED_CAPTION_ENTRY_POINT:
1694 return String::compose("The closed caption asset %1 has no <EntryPoint> tag.", note.note().get());
1695 case VerificationNote::Code::INCORRECT_CLOSED_CAPTION_ENTRY_POINT:
1696 return String::compose("The closed caption asset %1 has an <EntryPoint> other than 0.", note.note().get());
1697 case VerificationNote::Code::MISSING_HASH:
1698 return String::compose("The asset %1 has no <Hash> tag in the CPL.", note.note().get());
1699 case VerificationNote::Code::MISSING_FFEC_IN_FEATURE:
1700 return "The DCP is marked as a Feature but there is no FFEC (first frame of end credits) marker";
1701 case VerificationNote::Code::MISSING_FFMC_IN_FEATURE:
1702 return "The DCP is marked as a Feature but there is no FFMC (first frame of moving credits) marker";
1703 case VerificationNote::Code::MISSING_FFOC:
1704 return "There should be a FFOC (first frame of content) marker";
1705 case VerificationNote::Code::MISSING_LFOC:
1706 return "There should be a LFOC (last frame of content) marker";
1707 case VerificationNote::Code::INCORRECT_FFOC:
1708 return String::compose("The FFOC marker is %1 instead of 1", note.note().get());
1709 case VerificationNote::Code::INCORRECT_LFOC:
1710 return String::compose("The LFOC marker is %1 instead of 1 less than the duration of the last reel.", note.note().get());
1711 case VerificationNote::Code::MISSING_CPL_METADATA:
1712 return String::compose("The CPL %1 has no <CompositionMetadataAsset> tag.", note.note().get());
1713 case VerificationNote::Code::MISSING_CPL_METADATA_VERSION_NUMBER:
1714 return String::compose("The CPL %1 has no <VersionNumber> in its <CompositionMetadataAsset>.", note.note().get());
1715 case VerificationNote::Code::MISSING_EXTENSION_METADATA:
1716 return String::compose("The CPL %1 has no <ExtensionMetadata> in its <CompositionMetadataAsset>.", note.note().get());
1717 case VerificationNote::Code::INVALID_EXTENSION_METADATA:
1718 return String::compose("The CPL %1 has a malformed <ExtensionMetadata> (%2).", note.file()->filename(), note.note().get());
1719 case VerificationNote::Code::UNSIGNED_CPL_WITH_ENCRYPTED_CONTENT:
1720 return String::compose("The CPL %1, which has encrypted content, is not signed.", note.note().get());
1721 case VerificationNote::Code::UNSIGNED_PKL_WITH_ENCRYPTED_CONTENT:
1722 return String::compose("The PKL %1, which has encrypted content, is not signed.", note.note().get());
1723 case VerificationNote::Code::MISMATCHED_PKL_ANNOTATION_TEXT_WITH_CPL:
1724 return String::compose("The PKL %1 has only one CPL but its <AnnotationText> does not match the CPL's <ContentTitleText>.", note.note().get());
1725 case VerificationNote::Code::PARTIALLY_ENCRYPTED:
1726 return "Some assets are encrypted but some are not.";
1727 case VerificationNote::Code::INVALID_JPEG2000_CODESTREAM:
1728 return String::compose("The JPEG2000 codestream for at least one frame is invalid (%1)", note.note().get());
1729 case VerificationNote::Code::INVALID_JPEG2000_GUARD_BITS_FOR_2K:
1730 return String::compose("The JPEG2000 codestream uses %1 guard bits in a 2K image instead of 1.", note.note().get());
1731 case VerificationNote::Code::INVALID_JPEG2000_GUARD_BITS_FOR_4K:
1732 return String::compose("The JPEG2000 codestream uses %1 guard bits in a 4K image instead of 2.", note.note().get());
1733 case VerificationNote::Code::INVALID_JPEG2000_TILE_SIZE:
1734 return "The JPEG2000 tile size is not the same as the image size.";
1735 case VerificationNote::Code::INVALID_JPEG2000_CODE_BLOCK_WIDTH:
1736 return String::compose("The JPEG2000 codestream uses a code block width of %1 instead of 32.", note.note().get());
1737 case VerificationNote::Code::INVALID_JPEG2000_CODE_BLOCK_HEIGHT:
1738 return String::compose("The JPEG2000 codestream uses a code block height of %1 instead of 32.", note.note().get());
1739 case VerificationNote::Code::INCORRECT_JPEG2000_POC_MARKER_COUNT_FOR_2K:
1740 return String::compose("%1 POC markers found in 2K JPEG2000 codestream instead of 0.", note.note().get());
1741 case VerificationNote::Code::INCORRECT_JPEG2000_POC_MARKER_COUNT_FOR_4K:
1742 return String::compose("%1 POC markers found in 4K JPEG2000 codestream instead of 1.", note.note().get());
1743 case VerificationNote::Code::INCORRECT_JPEG2000_POC_MARKER:
1744 return String::compose("Incorrect POC marker content found (%1)", note.note().get());
1745 case VerificationNote::Code::INVALID_JPEG2000_POC_MARKER_LOCATION:
1746 return "POC marker found outside main header";
1747 case VerificationNote::Code::INVALID_JPEG2000_TILE_PARTS_FOR_2K:
1748 return String::compose("The JPEG2000 codestream has %1 tile parts in a 2K image instead of 3.", note.note().get());
1749 case VerificationNote::Code::INVALID_JPEG2000_TILE_PARTS_FOR_4K:
1750 return String::compose("The JPEG2000 codestream has %1 tile parts in a 4K image instead of 6.", note.note().get());
1751 case VerificationNote::Code::MISSING_JPEG200_TLM_MARKER:
1752 return "No TLM marker was found in a JPEG2000 codestream.";
1753 case VerificationNote::Code::MISMATCHED_TIMED_TEXT_RESOURCE_ID:
1754 return "The Resource ID in a timed text MXF did not match the ID of the contained XML.";
1755 case VerificationNote::Code::INCORRECT_TIMED_TEXT_ASSET_ID:
1756 return "The Asset ID in a timed text MXF is the same as the Resource ID or that of the contained XML.";
1757 case VerificationNote::Code::MISMATCHED_TIMED_TEXT_DURATION:
1759 vector<string> parts;
1760 boost::split (parts, note.note().get(), boost::is_any_of(" "));
1761 DCP_ASSERT (parts.size() == 2);
1762 return String::compose("The reel duration of some timed text (%1) is not the same as the ContainerDuration of its MXF (%2).", parts[0], parts[1]);
1764 case VerificationNote::Code::MISSED_CHECK_OF_ENCRYPTED:
1765 return "Some aspect of this DCP could not be checked because it is encrypted.";
1766 case VerificationNote::Code::EMPTY_TEXT:
1767 return "There is an empty <Text> node in a subtitle or closed caption.";
1768 case VerificationNote::Code::MISMATCHED_CLOSED_CAPTION_VALIGN:
1769 return "Some closed <Text> or <Image> nodes have different vertical alignments within a <Subtitle>.";
1770 case VerificationNote::Code::INCORRECT_CLOSED_CAPTION_ORDERING:
1771 return "Some closed captions are not listed in the order of their vertical position.";
1772 case VerificationNote::Code::UNEXPECTED_ENTRY_POINT:
1773 return "There is an <EntryPoint> node inside a <MainMarkers>.";
1774 case VerificationNote::Code::UNEXPECTED_DURATION:
1775 return "There is an <Duration> node inside a <MainMarkers>.";
1783 dcp::operator== (dcp::VerificationNote const& a, dcp::VerificationNote const& b)
1785 return a.type() == b.type() && a.code() == b.code() && a.note() == b.note() && a.file() == b.file() && a.line() == b.line();
1790 dcp::operator< (dcp::VerificationNote const& a, dcp::VerificationNote const& b)
1792 if (a.type() != b.type()) {
1793 return a.type() < b.type();
1796 if (a.code() != b.code()) {
1797 return a.code() < b.code();
1800 if (a.note() != b.note()) {
1801 return a.note().get_value_or("") < b.note().get_value_or("");
1804 if (a.file() != b.file()) {
1805 return a.file().get_value_or("") < b.file().get_value_or("");
1808 return a.line().get_value_or(0) < b.line().get_value_or(0);
1813 dcp::operator<< (std::ostream& s, dcp::VerificationNote const& note)
1815 s << note_to_string (note);
1817 s << " [" << note.note().get() << "]";
1820 s << " [" << note.file().get() << "]";
1823 s << " [" << note.line().get() << "]";