普通文本  |  323行  |  10.25 KB

#include "xmpmeta/xml/deserializer_impl.h"

#include <algorithm>

#include "base/integral_types.h"
#include "android-base/logging.h"
#include "strings/numbers.h"
#include "xmpmeta/base64.h"
#include "xmpmeta/xml/const.h"
#include "xmpmeta/xml/search.h"
#include "xmpmeta/xml/utils.h"
#include "xmpmeta/xmp_parser.h"

namespace dynamic_depth {
namespace xmpmeta {
namespace xml {
namespace {

// Converts a string to a boolean value if bool_str is one of "false" or "true",
// regardless of letter casing.
bool BoolStringToBool(const string& bool_str, bool* value) {
  string bool_str_lower = bool_str;
  std::transform(bool_str_lower.begin(), bool_str_lower.end(),
                 bool_str_lower.begin(), ::tolower);
  if (bool_str_lower == "true") {
    *value = true;
    return true;
  }
  if (bool_str_lower == "false") {
    *value = false;
    return true;
  }
  return false;
}

// Search for an rdf:Seq node, if it hasn't already been set.
// parent_name is the name of the rdf:Seq node's parent.
xmlNodePtr FindSeqNode(const xmlNodePtr node, const string& prefix,
                       const string& parent_name) {
  xmlNodePtr parent_node =
      DepthFirstSearch(node, prefix.data(), parent_name.data());
  if (parent_node == nullptr) {
    LOG(WARNING) << "Node " << parent_name << " not found";
    return nullptr;
  }
  return GetFirstSeqElement(parent_node);
}

// Extracts the specified string attribute.
bool GetStringProperty(const xmlNodePtr node, const string& prefix,
                       const string& property, string* value) {
  const xmlDocPtr doc = node->doc;
  for (const _xmlAttr* attribute = node->properties; attribute != nullptr;
       attribute = attribute->next) {
    // If prefix is not empty, then the attribute's namespace must not be null.
    if (((attribute->ns && !prefix.empty() &&
          strcmp(FromXmlChar(attribute->ns->prefix), prefix.data()) == 0) ||
         prefix.empty()) &&
        strcmp(FromXmlChar(attribute->name), property.data()) == 0) {
      xmlChar* attribute_string =
          xmlNodeListGetString(doc, attribute->children, 1);
      *value = FromXmlChar(attribute_string);
      xmlFree(attribute_string);
      return true;
    }
  }
  return false;
}

// Reads the contents of a node.
// E.g. <prefix:node_name>Contents Here</prefix:node_name>
bool ReadNodeContent(const xmlNodePtr node, const string& prefix,
                     const string& node_name, string* value) {
  auto* element = DepthFirstSearch(node, prefix.data(), node_name.data());
  if (element == nullptr) {
    return false;
  }
  if (!prefix.empty() &&
      (element->ns == nullptr || element->ns->prefix == nullptr ||
       strcmp(FromXmlChar(element->ns->prefix), prefix.data()) != 0)) {
    return false;
  }
  xmlChar* node_content = xmlNodeGetContent(element);
  *value = FromXmlChar(node_content);
  free(node_content);
  return true;
}

// Reads the string value of a property from the given XML node.
bool ReadStringProperty(const xmlNodePtr node, const string& prefix,
                        const string& property, string* value) {
  if (node == nullptr) {
    return false;
  }
  if (property.empty()) {
    LOG(ERROR) << "Property not given";
    return false;
  }

  // Try parsing in the format <Node ... Prefix:Property="Value"/>
  bool success = GetStringProperty(node, prefix, property, value);
  if (!success) {
    // Try parsing in the format <Prefix:Property>Value</Prefix:Property>
    success = ReadNodeContent(node, prefix, property, value);
  }
  return success;
}

// Same as ReadStringProperty, but applies base-64 decoding to the output.
bool ReadBase64Property(const xmlNodePtr node, const string& prefix,
                        const string& property, string* value) {
  string base64_data;
  if (!ReadStringProperty(node, prefix, property, &base64_data)) {
    return false;
  }
  return DecodeBase64(base64_data, value);
}

}  // namespace

DeserializerImpl::DeserializerImpl(const xmlNodePtr node)
    : node_(node), list_node_(nullptr) {}

// Public methods.
std::unique_ptr<Deserializer> DeserializerImpl::CreateDeserializer(
    const string& prefix, const string& child_name) const {
  if (child_name.empty()) {
    LOG(ERROR) << "Child name is empty";
    return nullptr;
  }
  xmlNodePtr child_node =
      DepthFirstSearch(node_, prefix.data(), child_name.data());
  if (child_node == nullptr) {
    return nullptr;
  }
  return std::unique_ptr<Deserializer>(
      new DeserializerImpl(child_node));  // NOLINT
}

std::unique_ptr<Deserializer>
DeserializerImpl::CreateDeserializerFromListElementAt(const string& prefix,
                                                      const string& list_name,
                                                      int index) const {
  if (index < 0) {
    LOG(ERROR) << "Index must be greater than or equal to zero";
    return nullptr;
  }

  if (list_name.empty()) {
    LOG(ERROR) << "Parent name cannot be empty";
    return nullptr;
  }
  // Search for an rdf:Seq node, if the name of list_node_ doesn't match
  // the given parent name.
  // Ensures thread safety.
  const xmlNodePtr list_node = [&] {
    std::lock_guard<std::mutex> lock(mtx_);
    if (list_node_ == nullptr ||
        string(FromXmlChar(list_node_->name)) != list_name) {
      list_node_ = DepthFirstSearch(node_, prefix.data(), list_name.data());
    }
    return list_node_;
  }();
  if (list_node == nullptr) {
    return nullptr;
  }

  xmlNodePtr seq_node = GetFirstSeqElement(list_node);
  if (seq_node == nullptr) {
    LOG(ERROR) << "No rdf:Seq node found on " << list_name;
    return nullptr;
  }
  xmlNodePtr li_node = GetElementAt(seq_node, index);
  if (li_node == nullptr) {
    return nullptr;
  }
  // Return a new Deserializer with the current rdf:li node and the current
  // node name.
  return std::unique_ptr<Deserializer>(
      new DeserializerImpl(li_node));  // NOLINT
}

bool DeserializerImpl::ParseBase64(const string& prefix, const string& name,
                                   string* value) const {
  return ReadBase64Property(node_, prefix, name, value);
}

bool DeserializerImpl::ParseIntArrayBase64(const string& prefix,
                                           const string& name,
                                           std::vector<int>* values) const {
  string base64_data;
  if (!ReadStringProperty(node_, prefix, name, &base64_data)) {
    return false;
  }
  return DecodeIntArrayBase64(base64_data, values);
}

bool DeserializerImpl::ParseFloatArrayBase64(const string& prefix,
                                             const string& name,
                                             std::vector<float>* values) const {
  string base64_data;
  if (!ReadStringProperty(node_, prefix, name, &base64_data)) {
    return false;
  }
  return DecodeFloatArrayBase64(base64_data, values);
}

bool DeserializerImpl::ParseDoubleArrayBase64(
    const string& prefix, const string& name,
    std::vector<double>* values) const {
  string base64_data;
  if (!ReadStringProperty(node_, prefix, name, &base64_data)) {
    return false;
  }
  return DecodeDoubleArrayBase64(base64_data, values);
}

bool DeserializerImpl::ParseBoolean(const string& prefix, const string& name,
                                    bool* value) const {
  string string_value;
  if (!ReadStringProperty(node_, prefix, name, &string_value)) {
    return false;
  }
  return BoolStringToBool(string_value, value);
}

bool DeserializerImpl::ParseDouble(const string& prefix, const string& name,
                                   double* value) const {
  string string_value;
  if (!ReadStringProperty(node_, prefix, name, &string_value)) {
    return false;
  }
  *value = std::stod(string_value);
  return true;
}

bool DeserializerImpl::ParseInt(const string& prefix, const string& name,
                                int* value) const {
  string string_value;
  if (!ReadStringProperty(node_, prefix, name, &string_value)) {
    return false;
  }
  *value = std::stoi(string_value);  // NOLINT
  return true;
}

bool DeserializerImpl::ParseFloat(const string& prefix, const string& name,
                                  float* value) const {
  string string_value;
  if (!ReadStringProperty(node_, prefix, name, &string_value)) {
    return false;
  }
  *value = std::stof(string_value);
  return true;
}

bool DeserializerImpl::ParseLong(const string& prefix, const string& name,
                                 int64* value) const {
  string string_value;
  if (!ReadStringProperty(node_, prefix, name, &string_value)) {
    return false;
  }
  *value = std::stol(string_value);
  return true;
}

bool DeserializerImpl::ParseString(const string& prefix, const string& name,
                                   string* value) const {
  return ReadStringProperty(node_, prefix, name, value);
}

bool DeserializerImpl::ParseIntArray(const string& prefix,
                                     const string& list_name,
                                     std::vector<int>* values) const {
  xmlNodePtr seq_node = FindSeqNode(node_, prefix, list_name);
  if (seq_node == nullptr) {
    return false;
  }
  values->clear();
  int i = 0;
  for (xmlNodePtr li_node = GetElementAt(seq_node, 0); li_node != nullptr;
       li_node = GetElementAt(seq_node, ++i)) {
    string value = GetLiNodeContent(li_node);
    for (int i = 0; i < value.size(); ++i) {
      if (!isdigit(value[i])) {
        LOG(ERROR) << "Could not parse rdf:li node value to an integer";
        return false;
      }
    }
    int int_value = std::atoi(value.c_str());  // NOLINT
    values->push_back(int_value);
  }

  return true;
}

bool DeserializerImpl::ParseDoubleArray(const string& prefix,
                                        const string& list_name,
                                        std::vector<double>* values) const {
  xmlNodePtr seq_node = FindSeqNode(node_, prefix, list_name);
  if (seq_node == nullptr) {
    return false;
  }
  values->clear();
  int i = 0;
  for (xmlNodePtr li_node = GetElementAt(seq_node, 0); li_node != nullptr;
       li_node = GetElementAt(seq_node, ++i)) {
    double double_value;
    if (!dynamic_depth::strings::safe_strtod(GetLiNodeContent(li_node),
                                             &double_value)) {
      LOG(ERROR) << "Could not parse rdf:li node value to a double";
      return false;
    }
    values->push_back(double_value);
  }

  return true;
}

}  // namespace xml
}  // namespace xmpmeta
}  // namespace dynamic_depth