普通文本  |  191行  |  6.46 KB

/*
 * Copyright (C) 2018 The Android Open Source Project
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *      http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

#include "utils/zlib/zlib.h"

#include "utils/flatbuffers.h"

namespace libtextclassifier3 {

std::unique_ptr<ZlibDecompressor> ZlibDecompressor::Instance(
    const unsigned char* dictionary, const unsigned int dictionary_size) {
  std::unique_ptr<ZlibDecompressor> result(
      new ZlibDecompressor(dictionary, dictionary_size));
  if (!result->initialized_) {
    result.reset();
  }
  return result;
}

ZlibDecompressor::ZlibDecompressor(const unsigned char* dictionary,
                                   const unsigned int dictionary_size) {
  memset(&stream_, 0, sizeof(stream_));
  stream_.zalloc = Z_NULL;
  stream_.zfree = Z_NULL;
  initialized_ = false;
  if (inflateInit(&stream_) != Z_OK) {
    TC3_LOG(ERROR) << "Could not initialize decompressor.";
    return;
  }
  if (dictionary != nullptr &&
      inflateSetDictionary(&stream_, dictionary, dictionary_size) != Z_OK) {
    TC3_LOG(ERROR) << "Could not set dictionary.";
    return;
  }
  initialized_ = true;
}

ZlibDecompressor::~ZlibDecompressor() {
  if (initialized_) {
    inflateEnd(&stream_);
  }
}

bool ZlibDecompressor::Decompress(const uint8* buffer, const int buffer_size,
                                  const int uncompressed_size,
                                  std::string* out) {
  if (out == nullptr) {
    return false;
  }
  out->resize(uncompressed_size);
  stream_.next_in = reinterpret_cast<const Bytef*>(buffer);
  stream_.avail_in = buffer_size;
  stream_.next_out = reinterpret_cast<Bytef*>(const_cast<char*>(out->c_str()));
  stream_.avail_out = uncompressed_size;
  return (inflate(&stream_, Z_SYNC_FLUSH) == Z_OK);
}

bool ZlibDecompressor::MaybeDecompress(
    const CompressedBuffer* compressed_buffer, std::string* out) {
  if (!compressed_buffer) {
    return true;
  }
  return Decompress(compressed_buffer->buffer()->Data(),
                    compressed_buffer->buffer()->size(),
                    compressed_buffer->uncompressed_size(), out);
}

bool ZlibDecompressor::MaybeDecompress(
    const CompressedBufferT* compressed_buffer, std::string* out) {
  if (!compressed_buffer) {
    return true;
  }
  return Decompress(compressed_buffer->buffer.data(),
                    compressed_buffer->buffer.size(),
                    compressed_buffer->uncompressed_size, out);
}

bool ZlibDecompressor::MaybeDecompressOptionallyCompressedBuffer(
    const flatbuffers::String* uncompressed_buffer,
    const CompressedBuffer* compressed_buffer, std::string* out) {
  if (uncompressed_buffer != nullptr) {
    *out = uncompressed_buffer->str();
    return true;
  }
  return MaybeDecompress(compressed_buffer, out);
}

bool ZlibDecompressor::MaybeDecompressOptionallyCompressedBuffer(
    const flatbuffers::Vector<uint8>* uncompressed_buffer,
    const CompressedBuffer* compressed_buffer, std::string* out) {
  if (uncompressed_buffer != nullptr) {
    *out =
        std::string(reinterpret_cast<const char*>(uncompressed_buffer->data()),
                    uncompressed_buffer->size());
    return true;
  }
  return MaybeDecompress(compressed_buffer, out);
}

std::unique_ptr<ZlibCompressor> ZlibCompressor::Instance(
    const unsigned char* dictionary, const unsigned int dictionary_size) {
  std::unique_ptr<ZlibCompressor> result(
      new ZlibCompressor(dictionary, dictionary_size));
  if (!result->initialized_) {
    result.reset();
  }
  return result;
}

ZlibCompressor::ZlibCompressor(const unsigned char* dictionary,
                               const unsigned int dictionary_size,
                               const int level, const int tmp_buffer_size) {
  memset(&stream_, 0, sizeof(stream_));
  stream_.zalloc = Z_NULL;
  stream_.zfree = Z_NULL;
  buffer_size_ = tmp_buffer_size;
  buffer_.reset(new Bytef[buffer_size_]);
  initialized_ = false;
  if (deflateInit(&stream_, level) != Z_OK) {
    TC3_LOG(ERROR) << "Could not initialize compressor.";
    return;
  }
  if (dictionary != nullptr &&
      deflateSetDictionary(&stream_, dictionary, dictionary_size) != Z_OK) {
    TC3_LOG(ERROR) << "Could not set dictionary.";
    return;
  }
  initialized_ = true;
}

ZlibCompressor::~ZlibCompressor() { deflateEnd(&stream_); }

void ZlibCompressor::Compress(const std::string& uncompressed_content,
                              CompressedBufferT* out) {
  out->uncompressed_size = uncompressed_content.size();
  out->buffer.clear();
  stream_.next_in =
      reinterpret_cast<const Bytef*>(uncompressed_content.c_str());
  stream_.avail_in = uncompressed_content.size();
  stream_.next_out = buffer_.get();
  stream_.avail_out = buffer_size_;
  unsigned char* buffer_deflate_start_position =
      reinterpret_cast<unsigned char*>(buffer_.get());
  int status;
  do {
    // Deflate chunk-wise.
    // Z_SYNC_FLUSH causes all pending output to be flushed, but doesn't
    // reset the compression state.
    // As we do not know how big the compressed buffer will be, we compress
    // chunk wise and append the flushed content to the output string buffer.
    // As we store the uncompressed size, we do not have to do this during
    // decompression.
    status = deflate(&stream_, Z_SYNC_FLUSH);
    unsigned char* buffer_deflate_end_position =
        reinterpret_cast<unsigned char*>(stream_.next_out);
    if (buffer_deflate_end_position != buffer_deflate_start_position) {
      out->buffer.insert(out->buffer.end(), buffer_deflate_start_position,
                         buffer_deflate_end_position);
      stream_.next_out = buffer_deflate_start_position;
      stream_.avail_out = buffer_size_;
    } else {
      break;
    }
  } while (status == Z_OK);
}

bool ZlibCompressor::GetDictionary(std::vector<unsigned char>* dictionary) {
  // Retrieve first the size of the dictionary.
  unsigned int size;
  if (deflateGetDictionary(&stream_, /*dictionary=*/Z_NULL, &size) != Z_OK) {
    return false;
  }
  dictionary->resize(size);
  return deflateGetDictionary(&stream_, dictionary->data(), &size) == Z_OK;
}

}  // namespace libtextclassifier3