/*
- Copyright (C) 2018-2019 Carl Hetherington <cth@carlh.net>
+ Copyright (C) 2018-2020 Carl Hetherington <cth@carlh.net>
This file is part of libdcp.
#include "exceptions.h"
#include "compose.hpp"
#include "raw_convert.h"
+#include <xercesc/util/PlatformUtils.hpp>
+#include <xercesc/parsers/XercesDOMParser.hpp>
+#include <xercesc/parsers/AbstractDOMParser.hpp>
+#include <xercesc/sax/HandlerBase.hpp>
+#include <xercesc/dom/DOMImplementation.hpp>
+#include <xercesc/dom/DOMImplementationLS.hpp>
+#include <xercesc/dom/DOMImplementationRegistry.hpp>
+#include <xercesc/dom/DOMLSParser.hpp>
+#include <xercesc/dom/DOMException.hpp>
+#include <xercesc/dom/DOMDocument.hpp>
+#include <xercesc/dom/DOMNodeList.hpp>
+#include <xercesc/dom/DOMError.hpp>
+#include <xercesc/dom/DOMLocator.hpp>
+#include <xercesc/dom/DOMNamedNodeMap.hpp>
+#include <xercesc/dom/DOMAttr.hpp>
+#include <xercesc/dom/DOMErrorHandler.hpp>
+#include <xercesc/framework/LocalFileInputSource.hpp>
+#include <boost/noncopyable.hpp>
#include <boost/foreach.hpp>
#include <boost/algorithm/string.hpp>
-#include <boost/regex.hpp>
+#include <map>
#include <list>
#include <vector>
#include <iostream>
using std::vector;
using std::string;
using std::cout;
+using std::map;
using boost::shared_ptr;
using boost::optional;
using boost::function;
using namespace dcp;
+using namespace xercesc;
enum Result {
RESULT_GOOD,
RESULT_BAD
};
+/** Convert a xerces XMLCh string to a std::string using XMLString::transcode.
+ *  @param a NUL-terminated XMLCh string; may be null.
+ *  @return Transcoded copy of a, or an empty string if a is null or
+ *  XMLString::transcode gives back a null pointer.
+ */
+static
+string
+xml_ch_to_string (XMLCh const * a)
+{
+	if (!a) {
+		return string();
+	}
+
+	char* x = XMLString::transcode(a);
+	if (!x) {
+		/* Constructing a std::string from a null pointer is undefined behaviour */
+		return string();
+	}
+
+	string const o(x);
+	/* The transcoded buffer must be given back with XMLString::release */
+	XMLString::release(&x);
+	return o;
+}
+
+/** One problem reported while parsing an XML file.  The message text and the
+ *  position are copied out of the SAXParseException on construction, so this
+ *  object holds plain values only.
+ */
+class XMLValidationError
+{
+public:
+	/** @param exception Exception whose message, line number and column number are copied */
+	XMLValidationError (SAXParseException const & exception)
+		: _message (xml_ch_to_string(exception.getMessage()))
+		, _line (exception.getLineNumber())
+		, _column (exception.getColumnNumber())
+	{}
+
+	/** @return the exception's message as a std::string */
+	string message () const
+	{
+		return _message;
+	}
+
+	/** @return the line number taken from the exception */
+	uint64_t line () const
+	{
+		return _line;
+	}
+
+	/** @return the column number taken from the exception */
+	uint64_t column () const
+	{
+		return _column;
+	}
+
+private:
+	string _message;
+	uint64_t _line;
+	uint64_t _column;
+};
+
+
+/** ErrorHandler which stores what it is told about (warnings, errors and
+ *  fatal errors are all treated the same way) as a list of XMLValidationError.
+ */
+class DCPErrorHandler : public ErrorHandler
+{
+public:
+	void warning(const SAXParseException& exception)
+	{
+		maybe_add (XMLValidationError(exception));
+	}
+
+	void error(const SAXParseException& exception)
+	{
+		maybe_add (XMLValidationError(exception));
+	}
+
+	void fatalError(const SAXParseException& exception)
+	{
+		maybe_add (XMLValidationError(exception));
+	}
+
+	/** Forget everything that has been stored so far */
+	void resetErrors()
+	{
+		_errors.clear ();
+	}
+
+	/** @return a copy of the stored errors, in the order they were reported */
+	list<XMLValidationError> errors () const
+	{
+		return _errors;
+	}
+
+private:
+	/** Store e, unless its message contains both of the phrases tested below,
+	 *  in which case it is dropped without being recorded.
+	 */
+	void maybe_add (XMLValidationError e)
+	{
+		string const message = e.message();
+		bool const mentions_schema_document = message.find("schema document") != string::npos;
+		bool const namespace_differs =
+			message.find("has different target namespace from the one specified in instance document") != string::npos;
+
+		/* XXX: nasty hack */
+		if (!mentions_schema_document || !namespace_differs) {
+			_errors.push_back (e);
+		}
+	}
+
+	list<XMLValidationError> _errors;
+};
+
+/** Owns the XMLCh transcoding of a std::string: the buffer is made by
+ *  XMLString::transcode in the constructor and handed to XMLString::release
+ *  in the destructor.
+ */
+class StringToXMLCh : public boost::noncopyable
+{
+public:
+	/** @param a String to transcode */
+	StringToXMLCh (string a)
+		: _buffer (XMLString::transcode(a.c_str()))
+	{}
+
+	~StringToXMLCh ()
+	{
+		XMLString::release (&_buffer);
+	}
+
+	/** @return the transcoded string; it is released when this object is destroyed */
+	XMLCh const * get () const
+	{
+		return _buffer;
+	}
+
+private:
+	XMLCh* _buffer;
+};
+
+/** EntityResolver which maps a fixed set of system IDs (URLs) to files of
+ *  the same leaf name inside a local directory.
+ */
+class LocalFileResolver : public EntityResolver
+{
+public:
+	/** @param xsd_dtd_directory Directory in which the local copies are looked for */
+	LocalFileResolver (boost::filesystem::path xsd_dtd_directory)
+		: _xsd_dtd_directory (xsd_dtd_directory)
+	{
+		_files["http://www.w3.org/2001/XMLSchema.dtd"] = "XMLSchema.dtd";
+		_files["http://www.w3.org/2001/03/xml.xsd"] = "xml.xsd";
+		_files["http://www.w3.org/TR/2002/REC-xmldsig-core-20020212/xmldsig-core-schema.xsd"] = "xmldsig-core-schema.xsd";
+		_files["http://www.digicine.com/schemas/437-Y/2007/Main-Stereo-Picture-CPL.xsd"] = "Main-Stereo-Picture-CPL.xsd";
+		_files["http://www.digicine.com/PROTO-ASDCP-CPL-20040511.xsd"] = "PROTO-ASDCP-CPL-20040511.xsd";
+		_files["http://www.digicine.com/PROTO-ASDCP-PKL-20040311.xsd"] = "PROTO-ASDCP-PKL-20040311.xsd";
+		_files["http://www.digicine.com/PROTO-ASDCP-AM-20040311.xsd"] = "PROTO-ASDCP-AM-20040311.xsd";
+	}
+
+	/** @param system_id System ID of the entity being asked for (the public ID is ignored).
+	 *  @return 0 if system_id is not one of the known URLs, otherwise a newly-allocated
+	 *  LocalFileInputSource for the corresponding file in the local directory.
+	 *  NOTE(review): presumably the caller takes ownership of the returned object; confirm
+	 *  against the xerces EntityResolver documentation.
+	 */
+	InputSource* resolveEntity(XMLCh const *, XMLCh const * system_id)
+	{
+		map<string, string>::const_iterator const found = _files.find (xml_ch_to_string(system_id));
+		if (found == _files.end()) {
+			return 0;
+		}
+
+		boost::filesystem::path const local_file = _xsd_dtd_directory / found->second;
+		StringToXMLCh local_file_ch (local_file.string());
+		return new LocalFileInputSource(local_file_ch.get());
+	}
+
+private:
+	/** Known system IDs, mapped to the leaf name of the local copy */
+	std::map<string, string> _files;
+	boost::filesystem::path _xsd_dtd_directory;
+};
+
+/** Calls XMLPlatformUtils::Terminate() when destroyed, so that a successful
+ *  XMLPlatformUtils::Initialize() is matched by a Terminate() even when an
+ *  exception is thrown in between.
+ */
+class XercesTerminateGuard : public boost::noncopyable
+{
+public:
+	~XercesTerminateGuard ()
+	{
+		XMLPlatformUtils::Terminate ();
+	}
+};
+
+/** Parse an XML file with schema validation switched on, using the schema and
+ *  DTD files in a local directory, and report what the parser complains about.
+ *  @param xml_file File to validate.
+ *  @param xsd_dtd_directory Directory containing the .xsd / .dtd files named below.
+ *  @param notes List to which one VERIFY_ERROR / XML_VALIDATION_ERROR note is
+ *  appended for each problem collected by the error handler.
+ *  @throws MiscError if xerces cannot be initialised, or if it throws while parsing.
+ */
+static
+void
+validate_xml (boost::filesystem::path xml_file, boost::filesystem::path xsd_dtd_directory, list<VerificationNote>& notes)
+{
+	try {
+		XMLPlatformUtils::Initialize ();
+	} catch (XMLException&) {
+		throw MiscError ("Failed to initialise xerces library");
+	}
+
+	DCPErrorHandler error_handler;
+
+	/* All the xerces objects in this scope must be destroyed before XMLPlatformUtils::Terminate() is called */
+	{
+		/* Declared first so that it is destroyed last: Terminate() then runs after the
+		   parser and resolver have gone, whether we leave this scope normally or
+		   because one of the MiscErrors below is thrown.
+		*/
+		XercesTerminateGuard terminate_guard;
+
+		XercesDOMParser parser;
+		parser.setValidationScheme(XercesDOMParser::Val_Always);
+		parser.setDoNamespaces(true);
+		parser.setDoSchema(true);
+
+		/* Namespace -> leaf name of the schema file in xsd_dtd_directory */
+		map<string, string> schema;
+		schema["http://www.w3.org/2000/09/xmldsig#"] = "xmldsig-core-schema.xsd";
+		schema["http://www.w3.org/TR/2002/REC-xmldsig-core-20020212/xmldsig-core-schema.xsd"] = "xmldsig-core-schema.xsd";
+		schema["http://www.smpte-ra.org/schemas/429-7/2006/CPL"] = "SMPTE-429-7-2006-CPL.xsd";
+		schema["http://www.smpte-ra.org/schemas/429-8/2006/PKL"] = "SMPTE-429-8-2006-PKL.xsd";
+		schema["http://www.smpte-ra.org/schemas/429-9/2007/AM"] = "SMPTE-429-9-2007-AM.xsd";
+		schema["http://www.digicine.com/schemas/437-Y/2007/Main-Stereo-Picture-CPL.xsd"] = "Main-Stereo-Picture-CPL.xsd";
+		schema["http://www.digicine.com/PROTO-ASDCP-CPL-20040511#"] = "PROTO-ASDCP-CPL-20040511.xsd";
+		schema["http://www.digicine.com/PROTO-ASDCP-PKL-20040311#"] = "PROTO-ASDCP-PKL-20040311.xsd";
+		schema["http://www.digicine.com/PROTO-ASDCP-AM-20040311#"] = "PROTO-ASDCP-AM-20040311.xsd";
+
+		/* Build a space-separated list of "namespace path" pairs.
+		   NOTE(review): a space inside xsd_dtd_directory would presumably break this list; confirm.
+		*/
+		string locations;
+		for (map<string, string>::const_iterator i = schema.begin(); i != schema.end(); ++i) {
+			locations += i->first;
+			locations += " ";
+			boost::filesystem::path p = xsd_dtd_directory / i->second;
+			locations += p.string() + " ";
+		}
+
+		parser.setExternalSchemaLocation(locations.c_str());
+		parser.setValidationSchemaFullChecking(true);
+		parser.setErrorHandler(&error_handler);
+
+		LocalFileResolver resolver (xsd_dtd_directory);
+		parser.setEntityResolver(&resolver);
+
+		try {
+			parser.resetDocumentPool();
+			parser.parse(xml_file.string().c_str());
+		} catch (XMLException& e) {
+			throw MiscError(xml_ch_to_string(e.getMessage()));
+		} catch (DOMException& e) {
+			throw MiscError(xml_ch_to_string(e.getMessage()));
+		} catch (...) {
+			throw MiscError("Unknown exception from xerces");
+		}
+	}
+
+	/* XMLPlatformUtils::Terminate() has been called by now; error_handler holds only copied strings and numbers */
+	BOOST_FOREACH (XMLValidationError i, error_handler.errors()) {
+		notes.push_back (
+			VerificationNote(
+				VerificationNote::VERIFY_ERROR,
+				VerificationNote::XML_VALIDATION_ERROR,
+				i.message(),
+				xml_file,
+				i.line()
+				)
+			);
+	}
+}
+
static Result
verify_asset (shared_ptr<DCP> dcp, shared_ptr<ReelMXF> reel_mxf, function<void (float)> progress)
{
return RESULT_GOOD;
}
-static
-bool
-good_urn_uuid (string id)
-{
- boost::regex ex("urn:uuid:[0-9a-f]{8}-[0-9a-f]{4}-[0-9a-f]{4}-[0-9a-f]{4}-[0-9a-f]{12}");
- return boost::regex_match (id, ex);
-}
-
-static
-bool
-good_date (string date)
-{
- boost::regex ex("\\d{4}-(\\d{2})-(\\d{2})T(\\d{2}):(\\d{2}):(\\d{2})[+-](\\d{2}):(\\d{2})");
- boost::match_results<string::const_iterator> res;
- if (!regex_match (date, res, ex, boost::match_default)) {
- return false;
- }
- int const month = dcp::raw_convert<int>(res[1].str());
- if (month < 1 || month > 12) {
- return false;
- }
- int const day = dcp::raw_convert<int>(res[2].str());
- if (day < 1 || day > 31) {
- return false;
- }
- if (dcp::raw_convert<int>(res[3].str()) > 23) {
- return false;
- }
- if (dcp::raw_convert<int>(res[4].str()) > 59) {
- return false;
- }
- if (dcp::raw_convert<int>(res[5].str()) > 59) {
- return false;
- }
- if (dcp::raw_convert<int>(res[6].str()) > 23) {
- return false;
- }
- if (dcp::raw_convert<int>(res[7].str()) > 59) {
- return false;
- }
- return true;
-}
list<VerificationNote>
-dcp::verify (vector<boost::filesystem::path> directories, function<void (string, optional<boost::filesystem::path>)> stage, function<void (float)> progress)
+dcp::verify (
+ vector<boost::filesystem::path> directories,
+ function<void (string, optional<boost::filesystem::path>)> stage,
+ function<void (float)> progress,
+ boost::filesystem::path xsd_dtd_directory
+ )
{
+ xsd_dtd_directory = boost::filesystem::canonical (xsd_dtd_directory);
+
list<VerificationNote> notes;
list<shared_ptr<DCP> > dcps;
try {
dcp->read (&notes);
} catch (DCPReadError& e) {
- notes.push_back (VerificationNote(VerificationNote::VERIFY_ERROR, VerificationNote::Code::GENERAL_READ, string(e.what())));
+ notes.push_back (VerificationNote(VerificationNote::VERIFY_ERROR, VerificationNote::GENERAL_READ, string(e.what())));
} catch (XMLError& e) {
- notes.push_back (VerificationNote(VerificationNote::VERIFY_ERROR, VerificationNote::Code::GENERAL_READ, string(e.what())));
+ notes.push_back (VerificationNote(VerificationNote::VERIFY_ERROR, VerificationNote::GENERAL_READ, string(e.what())));
}
BOOST_FOREACH (shared_ptr<CPL> cpl, dcp->cpls()) {
stage ("Checking CPL", cpl->file());
-
- cxml::Document cpl_doc ("CompositionPlaylist");
- cpl_doc.read_file (cpl->file().get());
- if (!good_urn_uuid(cpl_doc.string_child("Id"))) {
- notes.push_back (VerificationNote(VerificationNote::VERIFY_ERROR, VerificationNote::Code::BAD_URN_UUID, string("CPL <Id> is malformed")));
- }
- if (!good_date(cpl_doc.string_child("IssueDate"))) {
- notes.push_back (VerificationNote(VerificationNote::VERIFY_ERROR, VerificationNote::Code::BAD_DATE, string("CPL <IssueDate> is malformed")));
- }
+ validate_xml (cpl->file().get(), xsd_dtd_directory, notes);
/* Check that the CPL's hash corresponds to the PKL */
BOOST_FOREACH (shared_ptr<PKL> i, dcp->pkls()) {
BOOST_FOREACH (shared_ptr<Reel> reel, cpl->reels()) {
stage ("Checking reel", optional<boost::filesystem::path>());
+
+ BOOST_FOREACH (shared_ptr<ReelAsset> i, reel->assets()) {
+ if (i->duration() && (i->duration().get() * i->edit_rate().denominator / i->edit_rate().numerator) < 1) {
+ notes.push_back (VerificationNote(VerificationNote::VERIFY_ERROR, VerificationNote::DURATION_TOO_SMALL, i->id()));
+ }
+ if ((i->intrinsic_duration() * i->edit_rate().denominator / i->edit_rate().numerator) < 1) {
+ notes.push_back (VerificationNote(VerificationNote::VERIFY_ERROR, VerificationNote::INTRINSIC_DURATION_TOO_SMALL, i->id()));
+ }
+ }
+
if (reel->main_picture()) {
/* Check reel stuff */
Fraction const frame_rate = reel->main_picture()->frame_rate();
switch (r) {
case RESULT_BAD:
notes.push_back (
- VerificationNote(
- VerificationNote::VERIFY_ERROR, VerificationNote::PICTURE_HASH_INCORRECT, *reel->main_picture()->asset()->file()
- )
- );
+ VerificationNote(
+ VerificationNote::VERIFY_ERROR, VerificationNote::PICTURE_HASH_INCORRECT, *reel->main_picture()->asset()->file()
+ )
+ );
break;
case RESULT_CPL_PKL_DIFFER:
- notes.push_back (VerificationNote(VerificationNote::VERIFY_ERROR, VerificationNote::PKL_CPL_PICTURE_HASHES_DISAGREE));
+ notes.push_back (
+ VerificationNote(
+ VerificationNote::VERIFY_ERROR, VerificationNote::PKL_CPL_PICTURE_HASHES_DISAGREE, *reel->main_picture()->asset()->file()
+ )
+ );
break;
default:
break;
switch (r) {
case RESULT_BAD:
notes.push_back (
- VerificationNote(
- VerificationNote::VERIFY_ERROR, VerificationNote::SOUND_HASH_INCORRECT, *reel->main_sound()->asset()->file()
- )
- );
+ VerificationNote(
+ VerificationNote::VERIFY_ERROR, VerificationNote::SOUND_HASH_INCORRECT, *reel->main_sound()->asset()->file()
+ )
+ );
break;
case RESULT_CPL_PKL_DIFFER:
- notes.push_back (VerificationNote (VerificationNote::VERIFY_ERROR, VerificationNote::PKL_CPL_SOUND_HASHES_DISAGREE));
+ notes.push_back (
+ VerificationNote(
+ VerificationNote::VERIFY_ERROR, VerificationNote::PKL_CPL_SOUND_HASHES_DISAGREE, *reel->main_sound()->asset()->file()
+ )
+ );
break;
default:
break;
}
}
}
+
+ BOOST_FOREACH (shared_ptr<PKL> pkl, dcp->pkls()) {
+ stage ("Checking PKL", pkl->file());
+ validate_xml (pkl->file().get(), xsd_dtd_directory, notes);
+ }
+
+ if (dcp->asset_map_path()) {
+ stage ("Checking ASSETMAP", dcp->asset_map_path().get());
+ validate_xml (dcp->asset_map_path().get(), xsd_dtd_directory, notes);
+ } else {
+ notes.push_back (VerificationNote(VerificationNote::VERIFY_ERROR, VerificationNote::MISSING_ASSETMAP));
+ }
}
return notes;
case dcp::VerificationNote::PICTURE_HASH_INCORRECT:
return dcp::String::compose("The hash of the picture asset %1 does not agree with the PKL file", note.file()->filename());
case dcp::VerificationNote::PKL_CPL_PICTURE_HASHES_DISAGREE:
- return "The PKL and CPL hashes disagree for a picture asset.";
+ return dcp::String::compose("The PKL and CPL hashes disagree for the picture asset %1", note.file()->filename());
case dcp::VerificationNote::SOUND_HASH_INCORRECT:
return dcp::String::compose("The hash of the sound asset %1 does not agree with the PKL file", note.file()->filename());
case dcp::VerificationNote::PKL_CPL_SOUND_HASHES_DISAGREE:
- return "The PKL and CPL hashes disagree for a sound asset.";
+ return dcp::String::compose("The PKL and CPL hashes disagree for the sound asset %1", note.file()->filename());
case dcp::VerificationNote::EMPTY_ASSET_PATH:
return "The asset map contains an empty asset path.";
case dcp::VerificationNote::MISSING_ASSET:
- return "The file for an asset in the asset map cannot be found.";
+ return String::compose("The file for an asset in the asset map cannot be found; missing file is %1.", note.file()->filename());
case dcp::VerificationNote::MISMATCHED_STANDARD:
return "The DCP contains both SMPTE and Interop parts.";
- case dcp::VerificationNote::BAD_URN_UUID:
- return "There is a badly-formed urn:uuid.";
- case dcp::VerificationNote::BAD_DATE:
- return "There is a badly-formed date.";
+ case dcp::VerificationNote::XML_VALIDATION_ERROR:
+ return String::compose("An XML file is badly formed: %1 (%2:%3)", note.note().get(), note.file()->filename(), note.line().get());
+ case dcp::VerificationNote::MISSING_ASSETMAP:
+ return "No ASSETMAP or ASSETMAP.xml was found";
+ case dcp::VerificationNote::INTRINSIC_DURATION_TOO_SMALL:
+ return String::compose("The intrinsic duration of an asset is less than 1 second long: %1", note.note().get());
+ case dcp::VerificationNote::DURATION_TOO_SMALL:
+ return String::compose("The duration of an asset is less than 1 second long: %1", note.note().get());
}
return "";
}
-