/*
* Copyright (C) 2016 The Android Open Source Project
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
#ifndef ART_COMPILER_DEBUG_ELF_DEBUG_LINE_WRITER_H_
#define ART_COMPILER_DEBUG_ELF_DEBUG_LINE_WRITER_H_
#include <algorithm>
#include <limits>
#include <string>
#include <unordered_map>
#include <unordered_set>
#include <utility>
#include <vector>
#include "debug/elf_compilation_unit.h"
#include "debug/src_map_elem.h"
#include "dex/dex_file-inl.h"
#include "dwarf/debug_line_opcode_writer.h"
#include "dwarf/headers.h"
#include "elf/elf_builder.h"
#include "oat_file.h"
#include "stack_map.h"
namespace art {
namespace debug {
// Sequence of dex position entries (dex address and source line) collected for one method.
using PositionInfos = std::vector<DexFile::PositionInfo>;
template<typename ElfTypes>
class ElfDebugLineWriter {
using Elf_Addr = typename ElfTypes::Addr;
public:
explicit ElfDebugLineWriter(ElfBuilder<ElfTypes>* builder) : builder_(builder) {
}
void Start() {
builder_->GetDebugLine()->Start();
}
// Write line table for given set of methods.
// Returns the number of bytes written.
size_t WriteCompilationUnit(ElfCompilationUnit& compilation_unit) {
const InstructionSet isa = builder_->GetIsa();
const bool is64bit = Is64BitInstructionSet(isa);
const Elf_Addr base_address = compilation_unit.is_code_address_text_relative
? builder_->GetText()->GetAddress()
: 0;
compilation_unit.debug_line_offset = builder_->GetDebugLine()->GetPosition();
std::vector<dwarf::FileEntry> files;
std::unordered_map<std::string, size_t> files_map;
std::vector<std::string> directories;
std::unordered_map<std::string, size_t> directories_map;
int code_factor_bits_ = 0;
int dwarf_isa = -1;
switch (isa) {
case InstructionSet::kArm: // arm actually means thumb2.
case InstructionSet::kThumb2:
code_factor_bits_ = 1; // 16-bit instuctions
dwarf_isa = 1; // DW_ISA_ARM_thumb.
break;
case InstructionSet::kArm64:
case InstructionSet::kMips:
case InstructionSet::kMips64:
code_factor_bits_ = 2; // 32-bit instructions
break;
case InstructionSet::kNone:
case InstructionSet::kX86:
case InstructionSet::kX86_64:
break;
}
std::unordered_set<uint64_t> seen_addresses(compilation_unit.methods.size());
dwarf::DebugLineOpCodeWriter<> opcodes(is64bit, code_factor_bits_);
for (const MethodDebugInfo* mi : compilation_unit.methods) {
// Ignore function if we have already generated line table for the same address.
// It would confuse the debugger and the DWARF specification forbids it.
// We allow the line table for method to be replicated in different compilation unit.
// This ensures that each compilation unit contains line table for all its methods.
if (!seen_addresses.insert(mi->code_address).second) {
continue;
}
uint32_t prologue_end = std::numeric_limits<uint32_t>::max();
std::vector<SrcMapElem> pc2dex_map;
if (mi->code_info != nullptr) {
// Use stack maps to create mapping table from pc to dex.
const CodeInfo code_info(mi->code_info);
pc2dex_map.reserve(code_info.GetNumberOfStackMaps());
for (StackMap stack_map : code_info.GetStackMaps()) {
const uint32_t pc = stack_map.GetNativePcOffset(isa);
const int32_t dex = stack_map.GetDexPc();
pc2dex_map.push_back({pc, dex});
if (stack_map.HasDexRegisterMap()) {
// Guess that the first map with local variables is the end of prologue.
prologue_end = std::min(prologue_end, pc);
}
}
std::sort(pc2dex_map.begin(), pc2dex_map.end());
}
if (pc2dex_map.empty()) {
continue;
}
// Compensate for compiler's off-by-one-instruction error.
//
// The compiler generates stackmap with PC *after* the branch instruction
// (because this is the PC which is easier to obtain when unwinding).
//
// However, the debugger is more clever and it will ask us for line-number
// mapping at the location of the branch instruction (since the following
// instruction could belong to other line, this is the correct thing to do).
//
// So we really want to just decrement the PC by one instruction so that the
// branch instruction is covered as well. However, we do not know the size
// of the previous instruction, and we can not subtract just a fixed amount
// (the debugger would trust us that the PC is valid; it might try to set
// breakpoint there at some point, and setting breakpoint in mid-instruction
// would make the process crash in spectacular way).
//
// Therefore, we say that the PC which the compiler gave us for the stackmap
// is the end of its associated address range, and we use the PC from the
// previous stack map as the start of the range. This ensures that the PC is
// valid and that the branch instruction is covered.
//
// This ensures we have correct line number mapping at call sites (which is
// important for backtraces), but there is nothing we can do for non-call
// sites (so stepping through optimized code in debugger is not possible).
//
// We do not adjust the stackmaps if the code was compiled as debuggable.
// In that case, the stackmaps should accurately cover all instructions.
if (!mi->is_native_debuggable) {
for (size_t i = pc2dex_map.size() - 1; i > 0; --i) {
pc2dex_map[i].from_ = pc2dex_map[i - 1].from_;
}
pc2dex_map[0].from_ = 0;
}
Elf_Addr method_address = base_address + mi->code_address;
PositionInfos dex2line_map;
const DexFile* dex = mi->dex_file;
DCHECK(dex != nullptr);
CodeItemDebugInfoAccessor accessor(*dex, mi->code_item, mi->dex_method_index);
if (!accessor.DecodeDebugPositionInfo(
[&](const DexFile::PositionInfo& entry) {
dex2line_map.push_back(entry);
return false;
})) {
continue;
}
if (dex2line_map.empty()) {
continue;
}
opcodes.SetAddress(method_address);
if (dwarf_isa != -1) {
opcodes.SetISA(dwarf_isa);
}
// Get and deduplicate directory and filename.
int file_index = 0; // 0 - primary source file of the compilation.
auto& dex_class_def = dex->GetClassDef(mi->class_def_index);
const char* source_file = dex->GetSourceFile(dex_class_def);
if (source_file != nullptr) {
std::string file_name(source_file);
size_t file_name_slash = file_name.find_last_of('/');
std::string class_name(dex->GetClassDescriptor(dex_class_def));
size_t class_name_slash = class_name.find_last_of('/');
std::string full_path(file_name);
// Guess directory from package name.
int directory_index = 0; // 0 - current directory of the compilation.
if (file_name_slash == std::string::npos && // Just filename.
class_name.front() == 'L' && // Type descriptor for a class.
class_name_slash != std::string::npos) { // Has package name.
std::string package_name = class_name.substr(1, class_name_slash - 1);
auto it = directories_map.find(package_name);
if (it == directories_map.end()) {
directory_index = 1 + directories.size();
directories_map.emplace(package_name, directory_index);
directories.push_back(package_name);
} else {
directory_index = it->second;
}
full_path = package_name + "/" + file_name;
}
// Add file entry.
auto it2 = files_map.find(full_path);
if (it2 == files_map.end()) {
file_index = 1 + files.size();
files_map.emplace(full_path, file_index);
files.push_back(dwarf::FileEntry {
file_name,
directory_index,
0, // Modification time - NA.
0, // File size - NA.
});
} else {
file_index = it2->second;
}
}
opcodes.SetFile(file_index);
// Generate mapping opcodes from PC to Java lines.
if (file_index != 0) {
// If the method was not compiled as native-debuggable, we still generate all available
// lines, but we try to prevent the debugger from stepping and setting breakpoints since
// the information is too inaccurate for that (breakpoints would be set after the calls).
const bool default_is_stmt = mi->is_native_debuggable;
bool first = true;
for (SrcMapElem pc2dex : pc2dex_map) {
uint32_t pc = pc2dex.from_;
int dex_pc = pc2dex.to_;
// Find mapping with address with is greater than our dex pc; then go back one step.
auto dex2line = std::upper_bound(
dex2line_map.begin(),
dex2line_map.end(),
dex_pc,
[](uint32_t address, const DexFile::PositionInfo& entry) {
return address < entry.address_;
});
// Look for first valid mapping after the prologue.
if (dex2line != dex2line_map.begin() && pc >= prologue_end) {
int line = (--dex2line)->line_;
if (first) {
first = false;
if (pc > 0) {
// Assume that any preceding code is prologue.
int first_line = dex2line_map.front().line_;
// Prologue is not a sensible place for a breakpoint.
opcodes.SetIsStmt(false);
opcodes.AddRow(method_address, first_line);
opcodes.SetPrologueEnd();
}
opcodes.SetIsStmt(default_is_stmt);
opcodes.AddRow(method_address + pc, line);
} else if (line != opcodes.CurrentLine()) {
opcodes.SetIsStmt(default_is_stmt);
opcodes.AddRow(method_address + pc, line);
}
}
}
} else {
// line 0 - instruction cannot be attributed to any source line.
opcodes.AddRow(method_address, 0);
}
opcodes.AdvancePC(method_address + mi->code_size);
opcodes.EndSequence();
}
std::vector<uint8_t> buffer;
buffer.reserve(opcodes.data()->size() + KB);
WriteDebugLineTable(directories, files, opcodes, &buffer);
builder_->GetDebugLine()->WriteFully(buffer.data(), buffer.size());
return buffer.size();
}
void End() {
builder_->GetDebugLine()->End();
}
private:
ElfBuilder<ElfTypes>* builder_;
};
} // namespace debug
} // namespace art
#endif // ART_COMPILER_DEBUG_ELF_DEBUG_LINE_WRITER_H_