tagparser/matroska/matroskatagfield.cpp

308 lines
12 KiB
C++

#include "./matroskatagfield.h"
#include "./ebmlelement.h"
#include "./matroskacontainer.h"
#include "../exceptions.h"
#include <c++utilities/io/binarywriter.h>
#include <memory>
using namespace std;
using namespace CppUtilities;
namespace TagParser {
/*!
* \class TagParser::MatroskaTagField
* \brief The MatroskaTagField class is used by MatroskaTag to store the fields.
*/
/*!
* \brief Constructs a new MatroskaTagField.
*/
MatroskaTagField::MatroskaTagField()
{
}
/*!
* \brief Constructs a new MatroskaTagField with the specified \a id and \a value.
*/
MatroskaTagField::MatroskaTagField(const string &id, const TagValue &value)
: TagField<MatroskaTagField>(id, value)
{
}
/*!
* \brief Parses field information from the specified EbmlElement.
*
* The specified atom should be a simple tag element. These elements
* represents the fields of a MatroskaTag.
*
* \throws Throws std::ios_base::failure when an IO error occurs.
* \throws Throws TagParser::Failure or a derived exception when a parsing
* error occurs.
*/
void MatroskaTagField::reparse(EbmlElement &simpleTagElement, Diagnostics &diag, bool parseNestedFields)
{
string context("parsing Matroska tag field");
simpleTagElement.parse(diag);
bool tagDefaultFound = false, tagLanguageFound = false, tagLanguageIETFFound = false;
for (EbmlElement *child = simpleTagElement.firstChild(); child; child = child->nextSibling()) {
try {
child->parse(diag);
} catch (const Failure &) {
diag.emplace_back(DiagLevel::Critical, "Unable to parse children of \"SimpleTag\"-element.", context);
break;
}
switch (child->id()) {
case MatroskaIds::TagName:
if (id().empty()) {
setId(child->readString());
context = "parsing Matroska tag field " + id();
} else {
diag.emplace_back(DiagLevel::Warning,
"\"SimpleTag\"-element contains multiple \"TagName\"-elements. Surplus TagName elements will be ignored.", context);
}
break;
case MatroskaIds::TagString:
case MatroskaIds::TagBinary:
if (value().isEmpty()) {
unique_ptr<char[]> buffer = make_unique<char[]>(child->dataSize());
child->stream().seekg(static_cast<streamoff>(child->dataOffset()));
child->stream().read(buffer.get(), static_cast<streamoff>(child->dataSize()));
switch (child->id()) {
case MatroskaIds::TagString:
value().assignData(move(buffer), child->dataSize(), TagDataType::Text, TagTextEncoding::Utf8);
break;
case MatroskaIds::TagBinary:
value().assignData(move(buffer), child->dataSize(), TagDataType::Undefined);
break;
}
} else {
diag.emplace_back(DiagLevel::Warning,
"\"SimpleTag\"-element contains multiple \"TagString\"/\"TagBinary\"-elements. Surplus \"TagName\"/\"TagBinary\"-elements will "
"be ignored.",
context);
}
break;
case MatroskaIds::TagLanguage:
if (!tagLanguageFound) {
tagLanguageFound = true;
auto language = child->readString();
if (language != "und") {
value().locale().emplace_back(std::move(language), LocaleFormat::ISO_639_2_B);
}
} else {
diag.emplace_back(DiagLevel::Warning,
"\"SimpleTag\"-element contains multiple \"TagLanguage\"-elements. Surplus \"TagLanguage\"-elements will be ignored.", context);
}
break;
case MatroskaIds::TagLanguageIETF:
if (!tagLanguageIETFFound) {
tagLanguageIETFFound = true;
value().locale().emplace_back(child->readString(), LocaleFormat::BCP_47);
} else {
diag.emplace_back(DiagLevel::Warning,
"\"SimpleTag\"-element contains multiple \"TagLanguageIETF\"-elements. Surplus \"TagLanguageIETF\"-elements will be ignored.",
context);
}
break;
case MatroskaIds::TagDefault:
if (!tagDefaultFound) {
setDefault(child->readUInteger() > 0);
tagDefaultFound = true;
} else {
diag.emplace_back(DiagLevel::Warning,
"\"SimpleTag\"-element contains multiple \"TagDefault\" elements. Surplus \"TagDefault\"-elements will be ignored.", context);
}
break;
case MatroskaIds::SimpleTag:
if (parseNestedFields) {
nestedFields().emplace_back();
nestedFields().back().reparse(*child, diag, true);
} else {
diag.emplace_back(DiagLevel::Warning,
"Nested fields are currently not supported. Nested tags can not be displayed and will be discarded when rewriting the file.",
context);
}
break;
case EbmlIds::Crc32:
case EbmlIds::Void:
break;
default:
diag.emplace_back(DiagLevel::Warning,
argsToString(
"\"SimpleTag\"-element contains unknown element ", child->idToString(), " at ", child->startOffset(), ". It will be ignored."),
context);
}
}
}
/*!
* \brief Prepares making.
* \returns Returns a MatroskaTagFieldMaker object which can be used to actually make the field.
* \remarks The field must NOT be mutated after making is prepared when it is intended to actually
* make the field using the make method of the returned object.
* \throws Throws TagParser::Failure or a derived exception when a making
* error occurs.
*
* This method might be useful when it is necessary to know the size of the field before making it.
*/
MatroskaTagFieldMaker MatroskaTagField::prepareMaking(Diagnostics &diag)
{
static const string context("making Matroska \"SimpleTag\" element.");
// check whether ID is empty
if (id().empty()) {
diag.emplace_back(DiagLevel::Critical, "Can not make \"SimpleTag\" element with empty \"TagName\".", context);
throw InvalidDataException();
}
try {
return MatroskaTagFieldMaker(*this, diag);
} catch (const ConversionException &) {
diag.emplace_back(DiagLevel::Critical, "The assigned tag value can not be converted to be written appropriately.", context);
throw InvalidDataException();
}
}
/*!
* \brief Saves the field to the specified \a stream (makes a "SimpleTag" element). *
* \throws Throws std::ios_base::failure when an IO error occurs.
* \throws Throws TagParser::Failure or a derived exception when a making
* error occurs.
*/
void MatroskaTagField::make(ostream &stream, Diagnostics &diag)
{
prepareMaking(diag).make(stream);
}
/*!
* \brief Ensures the specified \a id is upper-case as recommended by the Matroska spec.
* \sa https://matroska.org/technical/tagging.html#tag-formatting
*/
void MatroskaTagField::normalizeId(std::string &id)
{
for (auto &c : id) {
if (c >= 'a' && c <= 'z') {
c -= 'a' - 'A';
}
}
}
/*!
* \class TagParser::MatroskaTagFieldMaker
* \brief The MatroskaTagFieldMaker class helps making tag fields.
* It allows to calculate the required size.
* \sa See MatroskaTagField::prepareMaking() for more information.
*/
/*!
* \brief Prepares making the specified \a field.
* \sa See MatroskaTagField::prepareMaking() for more information.
*/
MatroskaTagFieldMaker::MatroskaTagFieldMaker(MatroskaTagField &field, Diagnostics &diag)
: m_field(field)
, m_language(m_field.value().locale().abbreviatedName(LocaleFormat::ISO_639_2_B, LocaleFormat::Unknown))
, m_languageIETF(m_field.value().locale().abbreviatedName(LocaleFormat::BCP_47))
, m_isBinary(false)
{
try {
m_stringValue = m_field.value().toString();
} catch (const ConversionException &) {
diag.emplace_back(DiagLevel::Warning,
"The assigned tag value can not be converted to a string and is treated as binary value (which is likely not what you want since "
"official Matroska specifiecation doesn't list any binary fields).",
"making Matroska \"SimpleTag\" element.");
m_isBinary = true;
}
// compute size of the mandatory "TagLanguage" element (if there's no language set, the 3 byte long value "und" is used)
const auto languageSize = m_language.empty() ? 3 : m_language.size();
const auto languageElementSize = 2 + EbmlElement::calculateSizeDenotationLength(languageSize) + languageSize;
// compute size of the optional "TagLanguageIETF" element
const auto languageIETFElementSize
= m_languageIETF.empty() ? 0 : (2 + EbmlElement::calculateSizeDenotationLength(m_languageIETF.size()) + m_languageIETF.size());
// compute "SimpleTag" element size
m_simpleTagSize =
// "TagName" element
+2 + EbmlElement::calculateSizeDenotationLength(m_field.id().size())
+ m_field.id().size()
// language elements
+ languageElementSize
+ languageIETFElementSize
// "TagDefault" element
+ 2 + 1
+ 1
// "TagString" element
+ 2 + EbmlElement::calculateSizeDenotationLength(m_stringValue.size()) + m_stringValue.size();
// compute size of nested tags
for (auto &nestedField : field.nestedFields()) {
m_nestedMaker.emplace_back(nestedField.prepareMaking(diag));
m_simpleTagSize += m_nestedMaker.back().m_totalSize;
}
m_totalSize = 2 + EbmlElement::calculateSizeDenotationLength(m_simpleTagSize) + m_simpleTagSize;
}
/*!
* \brief Saves the field (specified when constructing the object) to the
* specified \a stream (makes a "SimpleTag" element). *
* \throws Throws std::ios_base::failure when an IO error occurs.
* \throws Throws Assumes the data is already validated and thus does NOT
* throw TagParser::Failure or a derived exception.
*/
void MatroskaTagFieldMaker::make(ostream &stream) const
{
BinaryWriter writer(&stream);
char buff[8];
// write "SimpleTag" element
writer.writeUInt16BE(MatroskaIds::SimpleTag);
std::uint8_t sizeDenotationLen = EbmlElement::makeSizeDenotation(m_simpleTagSize, buff);
stream.write(buff, sizeDenotationLen);
// write "TagName" element
writer.writeUInt16BE(MatroskaIds::TagName);
sizeDenotationLen = EbmlElement::makeSizeDenotation(m_field.id().size(), buff);
stream.write(buff, sizeDenotationLen);
stream.write(m_field.id().c_str(), static_cast<std::streamsize>(m_field.id().size()));
// write "TagLanguage" element
writer.writeUInt16BE(MatroskaIds::TagLanguage);
if (m_language.empty()) {
stream.put(static_cast<ostream::char_type>(0x80 | 3));
stream.write("und", 3);
} else {
sizeDenotationLen = EbmlElement::makeSizeDenotation(m_language.size(), buff);
stream.write(buff, sizeDenotationLen);
stream.write(m_language.data(), static_cast<std::streamsize>(m_language.size()));
}
// write "TagLanguageIETF" element
if (!m_languageIETF.empty()) {
writer.writeUInt16BE(MatroskaIds::TagLanguageIETF);
sizeDenotationLen = EbmlElement::makeSizeDenotation(m_languageIETF.size(), buff);
stream.write(buff, sizeDenotationLen);
stream.write(m_languageIETF.data(), static_cast<std::streamsize>(m_languageIETF.size()));
}
// write "TagDefault" element
writer.writeUInt16BE(MatroskaIds::TagDefault);
stream.put(static_cast<ostream::char_type>(0x80 | 1));
stream.put(m_field.isDefault() ? 1 : 0);
// write "TagString"/"TagBinary" element
if (m_isBinary) {
writer.writeUInt16BE(MatroskaIds::TagBinary);
sizeDenotationLen = EbmlElement::makeSizeDenotation(m_field.value().dataSize(), buff);
stream.write(buff, sizeDenotationLen);
stream.write(m_field.value().dataPointer(), static_cast<std::streamsize>(m_field.value().dataSize()));
} else {
writer.writeUInt16BE(MatroskaIds::TagString);
sizeDenotationLen = EbmlElement::makeSizeDenotation(m_stringValue.size(), buff);
stream.write(buff, sizeDenotationLen);
stream.write(m_stringValue.data(), static_cast<std::streamsize>(m_stringValue.size()));
}
// make nested tags
for (const auto &maker : m_nestedMaker) {
maker.make(stream);
}
}
} // namespace TagParser