/*
* Copyright (C) 2017 The Android Open Source Project
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
#include "compact_dex_writer.h"
#include "android-base/stringprintf.h"
#include "base/logging.h"
#include "base/time_utils.h"
#include "dex/compact_dex_file.h"
#include "dex/compact_offset_table.h"
#include "dexlayout.h"
namespace art {
CompactDexWriter::CompactDexWriter(DexLayout* dex_layout)
: DexWriter(dex_layout, /*compute_offsets*/ true) {
CHECK(GetCompactDexLevel() != CompactDexLevel::kCompactDexLevelNone);
}
CompactDexLevel CompactDexWriter::GetCompactDexLevel() const {
return dex_layout_->GetOptions().compact_dex_level_;
}
CompactDexWriter::Container::Container(bool dedupe_code_items)
: code_item_dedupe_(dedupe_code_items, &data_section_),
data_item_dedupe_(/*dedupe*/ true, &data_section_) {}
uint32_t CompactDexWriter::WriteDebugInfoOffsetTable(Stream* stream) {
const uint32_t start_offset = stream->Tell();
const dex_ir::Collections& collections = header_->GetCollections();
// Debug offsets for method indexes. 0 means no debug info.
std::vector<uint32_t> debug_info_offsets(collections.MethodIdsSize(), 0u);
static constexpr InvokeType invoke_types[] = {
kDirect,
kVirtual
};
for (InvokeType invoke_type : invoke_types) {
for (const std::unique_ptr<dex_ir::ClassDef>& class_def : collections.ClassDefs()) {
// Skip classes that are not defined in this dex file.
dex_ir::ClassData* class_data = class_def->GetClassData();
if (class_data == nullptr) {
continue;
}
for (auto& method : *(invoke_type == InvokeType::kDirect
? class_data->DirectMethods()
: class_data->VirtualMethods())) {
const dex_ir::MethodId* method_id = method->GetMethodId();
dex_ir::CodeItem* code_item = method->GetCodeItem();
if (code_item != nullptr && code_item->DebugInfo() != nullptr) {
const uint32_t debug_info_offset = code_item->DebugInfo()->GetOffset();
const uint32_t method_idx = method_id->GetIndex();
if (debug_info_offsets[method_idx] != 0u) {
CHECK_EQ(debug_info_offset, debug_info_offsets[method_idx]);
}
debug_info_offsets[method_idx] = debug_info_offset;
}
}
}
}
std::vector<uint8_t> data;
debug_info_base_ = 0u;
debug_info_offsets_table_offset_ = 0u;
CompactOffsetTable::Build(debug_info_offsets,
&data,
&debug_info_base_,
&debug_info_offsets_table_offset_);
// Align the table and write it out.
stream->AlignTo(CompactOffsetTable::kAlignment);
debug_info_offsets_pos_ = stream->Tell();
stream->Write(data.data(), data.size());
// Verify that the whole table decodes as expected and measure average performance.
const bool kMeasureAndTestOutput = dex_layout_->GetOptions().verify_output_;
if (kMeasureAndTestOutput && !debug_info_offsets.empty()) {
uint64_t start_time = NanoTime();
stream->Begin();
CompactOffsetTable::Accessor accessor(stream->Begin() + debug_info_offsets_pos_,
debug_info_base_,
debug_info_offsets_table_offset_);
for (size_t i = 0; i < debug_info_offsets.size(); ++i) {
CHECK_EQ(accessor.GetOffset(i), debug_info_offsets[i]);
}
uint64_t end_time = NanoTime();
VLOG(dex) << "Average lookup time (ns) for debug info offsets: "
<< (end_time - start_time) / debug_info_offsets.size();
}
return stream->Tell() - start_offset;
}
CompactDexWriter::ScopedDataSectionItem::ScopedDataSectionItem(Stream* stream,
dex_ir::Item* item,
size_t alignment,
Deduper* deduper)
: stream_(stream),
item_(item),
alignment_(alignment),
deduper_(deduper),
start_offset_(stream->Tell()) {
stream_->AlignTo(alignment_);
}
CompactDexWriter::ScopedDataSectionItem::~ScopedDataSectionItem() {
// After having written, maybe dedupe the whole code item (excluding padding).
const uint32_t deduped_offset = deduper_->Dedupe(start_offset_,
stream_->Tell(),
item_->GetOffset());
// If we deduped, only use the deduped offset if the alignment matches the required alignment.
// Otherwise, return without deduping.
if (deduped_offset != Deduper::kDidNotDedupe && IsAlignedParam(deduped_offset, alignment_)) {
// Update the IR offset to the offset of the deduped item.
item_->SetOffset(deduped_offset);
// Clear the written data for the item so that the stream write doesn't abort in the future.
stream_->Clear(start_offset_, stream_->Tell() - start_offset_);
// Since we deduped, restore the offset to the original position.
stream_->Seek(start_offset_);
}
}
size_t CompactDexWriter::ScopedDataSectionItem::Written() const {
return stream_->Tell() - start_offset_;
}
void CompactDexWriter::WriteCodeItem(Stream* stream,
dex_ir::CodeItem* code_item,
bool reserve_only) {
DCHECK(code_item != nullptr);
DCHECK(!reserve_only) << "Not supported because of deduping.";
ScopedDataSectionItem data_item(stream,
code_item,
CompactDexFile::CodeItem::kAlignment,
code_item_dedupe_);
CompactDexFile::CodeItem disk_code_item;
uint16_t preheader_storage[CompactDexFile::CodeItem::kMaxPreHeaderSize] = {};
uint16_t* preheader_end = preheader_storage + CompactDexFile::CodeItem::kMaxPreHeaderSize;
const uint16_t* preheader = disk_code_item.Create(
code_item->RegistersSize(),
code_item->InsSize(),
code_item->OutsSize(),
code_item->TriesSize(),
code_item->InsnsSize(),
preheader_end);
const size_t preheader_bytes = (preheader_end - preheader) * sizeof(preheader[0]);
static constexpr size_t kPayloadInstructionRequiredAlignment = 4;
const uint32_t current_code_item_start = stream->Tell() + preheader_bytes;
if (!IsAlignedParam(current_code_item_start, kPayloadInstructionRequiredAlignment) ||
kIsDebugBuild) {
// If the preheader is going to make the code unaligned, consider adding 2 bytes of padding
// before if required.
IterationRange<DexInstructionIterator> instructions = code_item->Instructions();
SafeDexInstructionIterator it(instructions.begin(), instructions.end());
for (; !it.IsErrorState() && it < instructions.end(); ++it) {
// In case the instruction goes past the end of the code item, make sure to not process it.
if (std::next(it).IsErrorState()) {
break;
}
const Instruction::Code opcode = it->Opcode();
// Payload instructions possibly require special alignment for their data.
if (opcode == Instruction::FILL_ARRAY_DATA ||
opcode == Instruction::PACKED_SWITCH ||
opcode == Instruction::SPARSE_SWITCH) {
stream->Skip(
RoundUp(current_code_item_start, kPayloadInstructionRequiredAlignment) -
current_code_item_start);
break;
}
}
}
// Write preheader first.
stream->Write(reinterpret_cast<const uint8_t*>(preheader), preheader_bytes);
// Registered offset is after the preheader.
ProcessOffset(stream, code_item);
// Avoid using sizeof so that we don't write the fake instruction array at the end of the code
// item.
stream->Write(&disk_code_item, OFFSETOF_MEMBER(CompactDexFile::CodeItem, insns_));
// Write the instructions.
stream->Write(code_item->Insns(), code_item->InsnsSize() * sizeof(uint16_t));
// Write the post instruction data.
WriteCodeItemPostInstructionData(stream, code_item, reserve_only);
}
void CompactDexWriter::WriteDebugInfoItem(Stream* stream, dex_ir::DebugInfoItem* debug_info) {
ScopedDataSectionItem data_item(stream,
debug_info,
SectionAlignment(DexFile::kDexTypeDebugInfoItem),
data_item_dedupe_);
ProcessOffset(stream, debug_info);
stream->Write(debug_info->GetDebugInfo(), debug_info->GetDebugInfoSize());
}
CompactDexWriter::Deduper::Deduper(bool enabled, DexContainer::Section* section)
: enabled_(enabled),
dedupe_map_(/*bucket_count*/ 32,
HashedMemoryRange::HashEqual(section),
HashedMemoryRange::HashEqual(section)) {}
uint32_t CompactDexWriter::Deduper::Dedupe(uint32_t data_start,
uint32_t data_end,
uint32_t item_offset) {
if (!enabled_) {
return kDidNotDedupe;
}
HashedMemoryRange range {data_start, data_end - data_start};
auto existing = dedupe_map_.emplace(range, item_offset);
if (!existing.second) {
// Failed to insert means we deduped, return the existing item offset.
return existing.first->second;
}
return kDidNotDedupe;
}
void CompactDexWriter::SortDebugInfosByMethodIndex() {
dex_ir::Collections& collections = header_->GetCollections();
static constexpr InvokeType invoke_types[] = {
kDirect,
kVirtual
};
std::map<const dex_ir::DebugInfoItem*, uint32_t> method_idx_map;
for (InvokeType invoke_type : invoke_types) {
for (std::unique_ptr<dex_ir::ClassDef>& class_def : collections.ClassDefs()) {
// Skip classes that are not defined in this dex file.
dex_ir::ClassData* class_data = class_def->GetClassData();
if (class_data == nullptr) {
continue;
}
for (auto& method : *(invoke_type == InvokeType::kDirect
? class_data->DirectMethods()
: class_data->VirtualMethods())) {
const dex_ir::MethodId* method_id = method->GetMethodId();
dex_ir::CodeItem* code_item = method->GetCodeItem();
if (code_item != nullptr && code_item->DebugInfo() != nullptr) {
const dex_ir::DebugInfoItem* debug_item = code_item->DebugInfo();
method_idx_map.insert(std::make_pair(debug_item, method_id->GetIndex()));
}
}
}
}
std::sort(collections.DebugInfoItems().begin(),
collections.DebugInfoItems().end(),
[&](const std::unique_ptr<dex_ir::DebugInfoItem>& a,
const std::unique_ptr<dex_ir::DebugInfoItem>& b) {
auto it_a = method_idx_map.find(a.get());
auto it_b = method_idx_map.find(b.get());
uint32_t idx_a = it_a != method_idx_map.end() ? it_a->second : 0u;
uint32_t idx_b = it_b != method_idx_map.end() ? it_b->second : 0u;
return idx_a < idx_b;
});
}
void CompactDexWriter::WriteHeader(Stream* stream) {
CompactDexFile::Header header;
CompactDexFile::WriteMagic(&header.magic_[0]);
CompactDexFile::WriteCurrentVersion(&header.magic_[0]);
header.checksum_ = header_->Checksum();
std::copy_n(header_->Signature(), DexFile::kSha1DigestSize, header.signature_);
header.file_size_ = header_->FileSize();
// Since we are not necessarily outputting the same format as the input, avoid using the stored
// header size.
header.header_size_ = GetHeaderSize();
header.endian_tag_ = header_->EndianTag();
header.link_size_ = header_->LinkSize();
header.link_off_ = header_->LinkOffset();
const dex_ir::Collections& collections = header_->GetCollections();
header.map_off_ = collections.MapListOffset();
header.string_ids_size_ = collections.StringIdsSize();
header.string_ids_off_ = collections.StringIdsOffset();
header.type_ids_size_ = collections.TypeIdsSize();
header.type_ids_off_ = collections.TypeIdsOffset();
header.proto_ids_size_ = collections.ProtoIdsSize();
header.proto_ids_off_ = collections.ProtoIdsOffset();
header.field_ids_size_ = collections.FieldIdsSize();
header.field_ids_off_ = collections.FieldIdsOffset();
header.method_ids_size_ = collections.MethodIdsSize();
header.method_ids_off_ = collections.MethodIdsOffset();
header.class_defs_size_ = collections.ClassDefsSize();
header.class_defs_off_ = collections.ClassDefsOffset();
header.data_size_ = header_->DataSize();
header.data_off_ = header_->DataOffset();
header.owned_data_begin_ = owned_data_begin_;
header.owned_data_end_ = owned_data_end_;
// Compact dex specific flags.
header.debug_info_offsets_pos_ = debug_info_offsets_pos_;
header.debug_info_offsets_table_offset_ = debug_info_offsets_table_offset_;
header.debug_info_base_ = debug_info_base_;
header.feature_flags_ = 0u;
// In cases where apps are converted to cdex during install, maintain feature flags so that
// the verifier correctly verifies apps that aren't targetting default methods.
if (header_->SupportDefaultMethods()) {
header.feature_flags_ |= static_cast<uint32_t>(CompactDexFile::FeatureFlags::kDefaultMethods);
}
stream->Seek(0);
stream->Overwrite(reinterpret_cast<uint8_t*>(&header), sizeof(header));
}
size_t CompactDexWriter::GetHeaderSize() const {
return sizeof(CompactDexFile::Header);
}
void CompactDexWriter::WriteStringData(Stream* stream, dex_ir::StringData* string_data) {
ScopedDataSectionItem data_item(stream,
string_data,
SectionAlignment(DexFile::kDexTypeStringDataItem),
data_item_dedupe_);
ProcessOffset(stream, string_data);
stream->WriteUleb128(CountModifiedUtf8Chars(string_data->Data()));
stream->Write(string_data->Data(), strlen(string_data->Data()));
// Skip null terminator (already zeroed out, no need to write).
stream->Skip(1);
}
bool CompactDexWriter::CanGenerateCompactDex(std::string* error_msg) {
dex_ir::Collections& collections = header_->GetCollections();
static constexpr InvokeType invoke_types[] = {
kDirect,
kVirtual
};
std::vector<bool> saw_method_id(collections.MethodIdsSize(), false);
std::vector<dex_ir::CodeItem*> method_id_code_item(collections.MethodIdsSize(), nullptr);
std::vector<dex_ir::DebugInfoItem*> method_id_debug_info(collections.MethodIdsSize(), nullptr);
for (InvokeType invoke_type : invoke_types) {
for (std::unique_ptr<dex_ir::ClassDef>& class_def : collections.ClassDefs()) {
// Skip classes that are not defined in this dex file.
dex_ir::ClassData* class_data = class_def->GetClassData();
if (class_data == nullptr) {
continue;
}
for (auto& method : *(invoke_type == InvokeType::kDirect
? class_data->DirectMethods()
: class_data->VirtualMethods())) {
const uint32_t idx = method->GetMethodId()->GetIndex();
dex_ir::CodeItem* code_item = method->GetCodeItem();
dex_ir:: DebugInfoItem* debug_info_item = nullptr;
if (code_item != nullptr) {
debug_info_item = code_item->DebugInfo();
}
if (saw_method_id[idx]) {
if (method_id_code_item[idx] != code_item) {
*error_msg = android::base::StringPrintf("Conflicting code item for method id %u",
idx);
// Conflicting info, abort generation.
return false;
}
if (method_id_debug_info[idx] != debug_info_item) {
*error_msg = android::base::StringPrintf("Conflicting debug info for method id %u",
idx);
// Conflicting info, abort generation.
return false;
}
}
method_id_code_item[idx] = code_item;
method_id_debug_info[idx] = debug_info_item;
saw_method_id[idx] = true;
}
}
}
return true;
}
bool CompactDexWriter::Write(DexContainer* output, std::string* error_msg) {
DCHECK(error_msg != nullptr);
CHECK(compute_offsets_);
CHECK(output->IsCompactDexContainer());
if (!CanGenerateCompactDex(error_msg)) {
return false;
}
Container* const container = down_cast<Container*>(output);
// For now, use the same stream for both data and metadata.
Stream temp_main_stream(output->GetMainSection());
CHECK_EQ(output->GetMainSection()->Size(), 0u);
Stream temp_data_stream(output->GetDataSection());
Stream* main_stream = &temp_main_stream;
Stream* data_stream = &temp_data_stream;
// We want offset 0 to be reserved for null, seek to the data section alignment or the end of the
// section.
data_stream->Seek(std::max(
static_cast<uint32_t>(output->GetDataSection()->Size()),
kDataSectionAlignment));
code_item_dedupe_ = &container->code_item_dedupe_;
data_item_dedupe_ = &container->data_item_dedupe_;
// Starting offset is right after the header.
main_stream->Seek(GetHeaderSize());
dex_ir::Collections& collection = header_->GetCollections();
// Based on: https://source.android.com/devices/tech/dalvik/dex-format
// Since the offsets may not be calculated already, the writing must be done in the correct order.
const uint32_t string_ids_offset = main_stream->Tell();
WriteStringIds(main_stream, /*reserve_only*/ true);
WriteTypeIds(main_stream);
const uint32_t proto_ids_offset = main_stream->Tell();
WriteProtoIds(main_stream, /*reserve_only*/ true);
WriteFieldIds(main_stream);
WriteMethodIds(main_stream);
const uint32_t class_defs_offset = main_stream->Tell();
WriteClassDefs(main_stream, /*reserve_only*/ true);
const uint32_t call_site_ids_offset = main_stream->Tell();
WriteCallSiteIds(main_stream, /*reserve_only*/ true);
WriteMethodHandles(main_stream);
if (compute_offsets_) {
// Data section.
data_stream->AlignTo(kDataSectionAlignment);
}
owned_data_begin_ = data_stream->Tell();
// Write code item first to minimize the space required for encoded methods.
// For cdex, the code items don't depend on the debug info.
WriteCodeItems(data_stream, /*reserve_only*/ false);
// Sort the debug infos by method index order, this reduces size by ~0.1% by reducing the size of
// the debug info offset table.
SortDebugInfosByMethodIndex();
WriteDebugInfoItems(data_stream);
WriteEncodedArrays(data_stream);
WriteAnnotations(data_stream);
WriteAnnotationSets(data_stream);
WriteAnnotationSetRefs(data_stream);
WriteAnnotationsDirectories(data_stream);
WriteTypeLists(data_stream);
WriteClassDatas(data_stream);
WriteStringDatas(data_stream);
// Write delayed id sections that depend on data sections.
{
Stream::ScopedSeek seek(main_stream, string_ids_offset);
WriteStringIds(main_stream, /*reserve_only*/ false);
}
{
Stream::ScopedSeek seek(main_stream, proto_ids_offset);
WriteProtoIds(main_stream, /*reserve_only*/ false);
}
{
Stream::ScopedSeek seek(main_stream, class_defs_offset);
WriteClassDefs(main_stream, /*reserve_only*/ false);
}
{
Stream::ScopedSeek seek(main_stream, call_site_ids_offset);
WriteCallSiteIds(main_stream, /*reserve_only*/ false);
}
// Write the map list.
if (compute_offsets_) {
data_stream->AlignTo(SectionAlignment(DexFile::kDexTypeMapList));
collection.SetMapListOffset(data_stream->Tell());
} else {
data_stream->Seek(collection.MapListOffset());
}
// Map items are included in the data section.
GenerateAndWriteMapItems(data_stream);
// Write link data if it exists.
const std::vector<uint8_t>& link_data = collection.LinkData();
if (link_data.size() > 0) {
CHECK_EQ(header_->LinkSize(), static_cast<uint32_t>(link_data.size()));
if (compute_offsets_) {
header_->SetLinkOffset(data_stream->Tell());
} else {
data_stream->Seek(header_->LinkOffset());
}
data_stream->Write(&link_data[0], link_data.size());
}
// Write debug info offset table last to make dex file verifier happy.
WriteDebugInfoOffsetTable(data_stream);
data_stream->AlignTo(kDataSectionAlignment);
owned_data_end_ = data_stream->Tell();
if (compute_offsets_) {
header_->SetDataSize(data_stream->Tell());
if (header_->DataSize() != 0) {
// Offset must be zero when the size is zero.
main_stream->AlignTo(kDataSectionAlignment);
// For now, default to saying the data is right after the main stream.
header_->SetDataOffset(main_stream->Tell());
} else {
header_->SetDataOffset(0u);
}
}
// Write header last.
if (compute_offsets_) {
header_->SetFileSize(main_stream->Tell());
}
WriteHeader(main_stream);
// Trim sections to make sure they are sized properly.
output->GetMainSection()->Resize(header_->FileSize());
output->GetDataSection()->Resize(data_stream->Tell());
if (dex_layout_->GetOptions().update_checksum_) {
// Compute the cdex section (also covers the used part of the data section).
header_->SetChecksum(CompactDexFile::CalculateChecksum(output->GetMainSection()->Begin(),
output->GetMainSection()->Size(),
output->GetDataSection()->Begin(),
output->GetDataSection()->Size()));
// Rewrite the header with the calculated checksum.
WriteHeader(main_stream);
}
// Clear the dedupe to prevent interdex code item deduping. This does not currently work well with
// dex2oat's class unloading. The issue is that verification encounters quickened opcodes after
// the first dex gets unloaded.
code_item_dedupe_->Clear();
return true;
}
std::unique_ptr<DexContainer> CompactDexWriter::CreateDexContainer() const {
return std::unique_ptr<DexContainer>(
new CompactDexWriter::Container(dex_layout_->GetOptions().dedupe_code_items_));
}
} // namespace art