// ***************************************************************************** // * This file is part of the FreeFileSync project. It is distributed under * // * GNU General Public License: https://www.gnu.org/licenses/gpl-3.0 * // * Copyright (C) Zenju (zenju AT freefilesync DOT org) - All Rights Reserved * // ***************************************************************************** #ifndef XML_H_349578228034572457454554 #define XML_H_349578228034572457454554 #include #include #include #include "cvrt_struc.h" #include "parser.h" /// The zen::Xml namespace namespace zen { /** \file \brief Save and load byte streams from files */ ///Load XML document from a file /** Load and parse XML byte stream. Quick-exit if (potentially large) input file is not an XML. \param filePath Input file path \returns The loaded XML document \throw FileError */ namespace { XmlDoc loadXml(const Zstring& filePath) //throw FileError { FileInputPlain fileIn(filePath); //throw FileError const size_t blockSize = fileIn.getBlockSize(); //throw FileError bool xmlPrefixChecked = false; std::string buffer; for (;;) { warn_static("don't need zero-initialization! => resize_and_overwrite") buffer.resize(buffer.size() + blockSize); const size_t bytesRead = fileIn.tryRead(&*(buffer.end() - blockSize), blockSize); //throw FileError; may return short, only 0 means EOF! CONTRACT: bytesToRead > 0! buffer.resize(buffer.size() - blockSize + bytesRead); //caveat: unsigned arithmetics //quick test whether input is an XML: avoid loading large binary files up front! if (!xmlPrefixChecked && buffer.size() >= strLength(BYTE_ORDER_MARK_UTF8) + strLength("")) { xmlPrefixChecked = true; std::string_view bufStart = buffer; if (startsWith(bufStart, BYTE_ORDER_MARK_UTF8)) bufStart.remove_prefix(strLength(BYTE_ORDER_MARK_UTF8)); if (!startsWith(bufStart, "")) throw FileError(replaceCpy(_("File %x does not contain a valid configuration."), L"%x", fmtPath(filePath))); } if (bytesRead == 0) //end of file break; } try { return parseXml(buffer); //throw XmlParsingError } catch (const XmlParsingError& e) { throw FileError( replaceCpy(replaceCpy(replaceCpy(_("Error parsing file %x, row %y, column %z."), L"%x", fmtPath(filePath)), L"%y", formatNumber(e.row + 1)), L"%z", formatNumber(e.col + 1))); } } } ///Save XML document to a file /** Serialize XML to byte stream and save to file. \param doc The XML document to save \param filePath Output file path \throw FileError */ inline void saveXml(const XmlDoc& doc, const Zstring& filePath) //throw FileError { const std::string stream = serializeXml(doc); //noexcept try //only update XML file if there are changes { if (getFileSize(filePath) == stream.size()) //throw FileError if (getFileContent(filePath, nullptr /*notifyUnbufferedIO*/) == stream) //throw FileError return; } catch (FileError&) {} setFileContent(filePath, stream, nullptr /*notifyUnbufferedIO*/); //throw FileError } ///Proxy class to conveniently convert user data into XML structure class XmlOut { public: ///Construct an output proxy for an XML document /** \code zen::XmlDoc doc; zen::XmlOut out(doc); out["elem1"]( 1); // out["elem2"]( 2); //write data into XML elements out["elem3"](-3); // saveXml(doc, "out.xml"); //throw FileError \endcode Output: \verbatim 1 2 -3 \endverbatim */ explicit XmlOut(XmlDoc& doc) : ref_(&doc.root()) {} ///Retrieve a handle to an XML child element for writing /** The child element will be created if it is not yet existing. \param name The name of the child element */ XmlOut operator[](std::string name) const { XmlElement* child = ref_->getChild(name); return XmlOut(child ? *child : ref_->addChild(std::move(name))); } ///Retrieve a handle to an XML child element for writing /** The child element will be added, allowing for multiple elements with the same name. \tparam String Arbitrary string-like type: e.g. std::string, wchar_t*, char[], wchar_t, wxString, MyStringClass, ... \param name The name of the child element */ XmlOut addChild(std::string name) const { return XmlOut(ref_->addChild(std::move(name))); } ///Write user data to the underlying XML element /** This conversion requires a specialization of zen::writeText() or zen::writeStruc() for type T. \tparam T User type that is converted into an XML element value. */ template void operator()(const T& value) { writeStruc(value, *ref_); } ///Write user data to an XML attribute /** This conversion requires a specialization of zen::writeText() for type T. \code zen::XmlDoc doc; zen::XmlOut out(doc); out["elem"].attribute("attr1", 1); // out["elem"].attribute("attr2", 2); //write data into XML attributes out["elem"].attribute("attr3", -3); // saveXml(doc, "out.xml"); //throw FileError \endcode Output: \verbatim \endverbatim \tparam T String-convertible user data type: e.g. any string-like type, all built-in arithmetic numbers \sa XmlElement::setAttribute() */ template void attribute(std::string name, const T& value) { ref_->setAttribute(std::move(name), value); } private: ///Construct an output proxy for a single XML element /** \sa XmlOut(XmlDoc& doc) */ explicit XmlOut(XmlElement& element) : ref_(&element) {} XmlElement* ref_; //always bound! }; ///Proxy class to conveniently convert XML structure to user data class XmlIn { class ErrorLog; public: ///Construct an input proxy for an XML document /** \code zen::XmlDoc doc; ... //load document zen::XmlIn in(doc); in["elem1"](value1); // in["elem2"](value2); //read data from XML elements into variables "value1", "value2", "value3" in["elem3"](value3); // \endcode */ explicit XmlIn(const XmlDoc& doc) : nodeNameFormatted_('<' + doc.root().getName() + '>') { refList_.push_back(&doc.root()); } ///Retrieve a handle to an XML child element for reading /** It is \b not an error if the child element does not exist, but only later if a conversion to user data is attempted. \param name The name of the child element */ XmlIn operator[](const std::string& name) const { std::vector childList; if (const XmlElement* elem = get()) { auto itPair = elem->getChildren(name); std::for_each(itPair.first, itPair.second, [&](const XmlElement& child) { childList.push_back(&child); }); } return XmlIn(childList, getChildNameFormatted(name), log_); } ///Refer to next sibling element with the same name /** Example: Loop over all XML child elements named "Item" \verbatim 1 3 5 \endverbatim \code zen::XmlIn in(doc); ... for (zen::XmlIn child = in["Item"]; child; child.next()) { ... } \endcode */ void next() { ++refIndex_; } ///Test whether the underlying XML element exists /** \code XmlIn in(doc); XmlIn child = in["elem1"]; if (child) ... \endcode Use member pointer as implicit conversion to bool (C++ Templates - Vandevoorde/Josuttis; chapter 20) */ explicit operator bool() const { return get() != nullptr; } ///Read user data from the underlying XML element /** This conversion requires a specialization of zen::readText() or zen::readStruc() for type T. \tparam T User type that receives the data \return "true" if data was read successfully */ template bool operator()(T& value) const { if (const XmlElement* elem = get()) { if (readStruc(*elem, value)) return true; log_.ref().notifyConversionError(getNameFormatted()); } else log_.ref().notifyMissingElement(getNameFormatted()); return false; } bool hasAttribute(const std::string& name) const { if (const XmlElement* elem = get()) if (elem->hasAttribute(name)) return true; return false; } ///Read user data from an XML attribute /** This conversion requires a specialization of zen::readText() for type T. \code zen::XmlDoc doc; ... //load document zen::XmlIn in(doc); in["elem"].attribute("attr1", value1); // in["elem"].attribute("attr2", value2); //read data from XML attributes into variables "value1", "value2", "value3" in["elem"].attribute("attr3", value3); // \endcode \tparam String Arbitrary string-like type: e.g. std::string, wchar_t*, char[], wchar_t, wxString, MyStringClass, ... \tparam T String-convertible user data type: e.g. any string-like type, all built-in arithmetic numbers \returns "true" if the attribute was found and the conversion to the output value was successful. \sa XmlElement::getAttribute() */ template bool attribute(const std::string& name, T& value) const { if (const XmlElement* elem = get()) { if (elem->getAttribute(name, value)) return true; log_.ref().notifyMissingAttribute(getNameFormatted(), name); } else log_.ref().notifyMissingElement(getNameFormatted()); return false; } ///Notifies errors while mapping the XML to user data /** Error logging is shared by each hiearchy of XmlIn proxy instances that are created from each other. Consequently it doesn't matter which instance you query for errors: \code XmlIn in(doc); XmlIn inItem = in["item1"]; int value = 0; inItem(value); //let's assume this conversion failed assert(in.haveErrors() == inItem.haveErrors()); assert(in.getErrorsAs() == inItem.getErrorsAs()); \endcode Note that error logging is \b NOT global, but owned by all instances of a hierarchy of XmlIn proxies. Therefore it's safe to use unrelated XmlIn proxies in multiple threads. \n\n However be aware that the chain of connected proxy instances will be broken once you call XmlIn::get() to retrieve the underlying pointer. Errors that occur when working with this pointer are not logged by the original set of related instances. */ ///Get a list of XML element and attribute names which failed to convert to user data. /** \returns A list of XML element and attribute names, empty list if no errors occured. */ std::vector getErrors() const { std::vector output; for (const std::string& str : log_.ref().elementList()) output.push_back(utfTo(str)); return output; } private: XmlIn(const std::vector& siblingList, const std::string& nodeNameFormatted, const SharedRef& sharedlog) : refList_(siblingList), nodeNameFormatted_(nodeNameFormatted), log_(sharedlog) {} ///Return a pointer to the underlying Xml element, may be nullptr const XmlElement* get() const { return refIndex_ < refList_.size() ? refList_[refIndex_] : nullptr; } std::string getNameFormatted() const //" " { if (refIndex_ == 0 && refList_.size() <= 1) return nodeNameFormatted_; else return nodeNameFormatted_ + '[' + numberTo(refIndex_ + 1) + ']'; } std::string getChildNameFormatted(const std::string& childName) const { return getNameFormatted() + " <" + childName + '>'; } class ErrorLog { public: void notifyConversionError (const std::string& displayName) { insert(displayName); } void notifyMissingElement (const std::string& displayName) { insert(displayName); } void notifyMissingAttribute(const std::string& displayName, const std::string& attribName) { insert(displayName + " @" + attribName); } const std::vector& elementList() const { return failedElements; } private: void insert(const std::string& newVal) { if (usedElements.insert(newVal).second) failedElements.push_back(newVal); } std::vector failedElements; //unique list of failed elements std::set usedElements; }; std::vector refList_; //all sibling elements with same name (all pointers bound!) size_t refIndex_ = 0; //this sibling's index in refList_ std::string nodeNameFormatted_; mutable SharedRef log_ = makeSharedRef(); }; ///Check XML input proxy for errors and map to FileError exception /** \param xmlInput XML input proxy \throw FileError */ inline void checkXmlMappingErrors(const XmlIn& xmlInput) //throw FileError { if (const std::vector& errors = xmlInput.getErrors(); !errors.empty()) { std::wstring msg = _("The following XML elements could not be read:") + L'\n'; for (const std::wstring& elem : errors) msg += L'\n' + elem; throw FileError(msg); } } } #endif //XML_H_349578228034572457454554