path: root/lib
diff options
authorStephen Hines <>2014-09-02 22:01:35 +0000
committerGerrit Code Review <>2014-09-02 22:01:36 +0000
commit7488ffd672ad1146d8a615f03a96a79794cd0d73 (patch)
tree31bc36cdf3d95d6506d578bb21e21201eaee2347 /lib
parente673be8f0526f9cbc83093fb579c0f76de9e4e3c (diff)
parentb3323086ee04f9db9e85f7cae46510f91a137237 (diff)
Merge "Fix mclinker build based on the current merge point (6824c79120)." [refs: android-l-preview_r2, l-preview]
Diffstat (limited to 'lib')
3 files changed, 308 insertions, 0 deletions
diff --git a/lib/LD/ b/lib/LD/
index 4bfafd7..49a35cf 100644
--- a/lib/LD/
+++ b/lib/LD/
@@ -25,6 +25,7 @@ mcld_ld_SRC_FILES := \
EhFrameReader.cpp \
GarbageCollection.cpp \
GroupReader.cpp \
+ IdenticalCodeFolding.cpp \
LDContext.cpp \
LDFileFormat.cpp \
LDReader.cpp \
@@ -48,6 +49,7 @@ mcld_ld_SRC_FILES := \
# =====================================================
include $(CLEAR_VARS)
+LOCAL_C_INCLUDES += external/zlib
@@ -60,6 +62,7 @@ include $(BUILD_HOST_STATIC_LIBRARY)
# =====================================================
include $(CLEAR_VARS)
+LOCAL_C_INCLUDES += external/zlib
diff --git a/lib/LD/IdenticalCodeFolding.cpp b/lib/LD/IdenticalCodeFolding.cpp
new file mode 100644
index 0000000..b3ba59d
--- /dev/null
+++ b/lib/LD/IdenticalCodeFolding.cpp
@@ -0,0 +1,304 @@
+//===- IdenticalCodeFolding.cpp -------------------------------------------===//
+// The MCLinker Project
+// This file is distributed under the University of Illinois Open Source
+// License. See LICENSE.TXT for details.
+#include <mcld/Fragment/RegionFragment.h>
+#include <mcld/LD/IdenticalCodeFolding.h>
+#include <mcld/LD/LDContext.h>
+#include <mcld/LD/LDSection.h>
+#include <mcld/LD/RelocData.h>
+#include <mcld/LD/Relocator.h>
+#include <mcld/LD/ResolveInfo.h>
+#include <mcld/LD/SectionData.h>
+#include <mcld/LinkerConfig.h>
+#include <mcld/MC/Input.h>
+#include <mcld/GeneralOptions.h>
+#include <mcld/Module.h>
+#include <mcld/Support/Demangle.h>
+#include <mcld/Support/MsgHandling.h>
+#include <mcld/Target/GNULDBackend.h>
+#include <llvm/ADT/StringRef.h>
+#include <llvm/Support/Casting.h>
+#include <llvm/Support/Format.h>
+#include <cassert>
+#include <map>
+#include <set>
+#include <zlib.h>
+using namespace mcld;
+static bool isSymCtorOrDtor(const ResolveInfo& pSym)  // true only if the name passes the prefix filter below and isCtorOrDtor() accepts it
+ // Constructors and destructors can always be folded, because C++ forbids
+ // taking the address of a constructor or destructor.
+ llvm::StringRef name(, pSym.nameSize());
+ if (!name.startswith("_ZZ") && !name.startswith("_ZN")) {  // names without a "_ZZ" or "_ZN" prefix are rejected before calling isCtorOrDtor()
+ return false;
+ }
+ return isCtorOrDtor(, pSym.nameSize());
+IdenticalCodeFolding::IdenticalCodeFolding(const LinkerConfig& pConfig,
+ const TargetLDBackend& pBackend,
+ Module& pModule)
+ : m_Config(pConfig), m_Backend(pBackend), m_Module(pModule)  // members are initialized directly from the three constructor arguments
+void IdenticalCodeFolding::foldIdenticalCode()  // entry point: find candidates, match them iteratively, mark duplicates Folded, repoint their function symbols
+ // Step 1: collect the folding candidates (also fills m_KeptSections).
+ FoldingCandidates candidate_list;
+ findCandidates(candidate_list);
+ // Step 2: build each candidate's constant (round-invariant) content.
+ for (size_t i = 0; i < candidate_list.size(); ++i) {
+ candidate_list[i].initConstantContent(m_Backend, m_KeptSections);
+ }
+ // Step 3: repeat matching rounds until matchCandidates() reports convergence
+ // or the configured iteration limit is reached.
+ bool converged = false;
+ size_t iterations = 0;
+ while (!converged && (iterations < m_Config.options().getICFIterations())) {
+ converged = matchCandidates(candidate_list);
+ ++iterations;
+ }
+ if (m_Config.options().printICFSections()) {
+ debug(diag::debug_icf_iterations) << iterations;
+ }
+ // Step 4: mark every section that was matched to another one as Folded.
+ typedef std::set<Input*> FoldedObjects;
+ FoldedObjects folded_objs;  // input objects that own at least one folded section
+ KeptSections::iterator kept, keptEnd = m_KeptSections.end();
+ size_t index = 0;  // position of `kept` in the iteration over m_KeptSections
+ for (kept = m_KeptSections.begin(); kept != keptEnd; ++kept, ++index) {
+ LDSection* sect = (*kept).first;
+ Input* obj = (*kept).second.first;
+ size_t kept_index = (*kept).second.second;
+ if (index != kept_index) {  // stored index differs from this entry's position: treated as folded (presumably iteration order equals insertion order; confirm against the KeptSections type)
+ sect->setKind(LDFileFormat::Folded);
+ folded_objs.insert(obj);
+ if (m_Config.options().printICFSections()) {
+ KeptSections::iterator it = m_KeptSections.begin() + kept_index;
+ LDSection* kept_sect = (*it).first;
+ Input* kept_obj = (*it).second.first;
+ debug(diag::debug_icf_folded_section) << sect->name()
+ << obj->name()
+ << kept_sect->name()
+ << kept_obj->name();
+ }
+ }
+ }
+ // Redirect function symbols that live in folded sections to the kept section.
+ FoldedObjects::iterator fobj, fobjEnd = folded_objs.end();
+ for (fobj = folded_objs.begin(); fobj != fobjEnd; ++fobj) {
+ LDContext::sym_iterator sym, symEnd = (*fobj)->context()->symTabEnd();
+ for (sym = (*fobj)->context()->symTabBegin(); sym != symEnd; ++sym) {
+ if ((*sym)->hasFragRef() && ((*sym)->type() == ResolveInfo::Function)) {
+ LDSymbol* out_sym = (*sym)->resolveInfo()->outSymbol();
+ FragmentRef* frag_ref = out_sym->fragRef();
+ LDSection* sect = &(frag_ref->frag()->getParent()->getSection());
+ if (sect->kind() == LDFileFormat::Folded) {
+ size_t kept_index = m_KeptSections[sect].second;
+ LDSection* kept_sect =
+ (*(m_KeptSections.begin() + kept_index)).first;
+ frag_ref->assign(kept_sect->getSectionData()->front(),  // rebind to the kept section's first fragment, keeping the original offset
+ frag_ref->offset());
+ }
+ }
+ } // end of loop over the object's symbols
+ } // end of loop over objects with folded sections
+void IdenticalCodeFolding::findCandidates(FoldingCandidates& pCandidateList)  // per input object, registers eligible TEXT sections in m_KeptSections and appends them to pCandidateList
+ Module::obj_iterator obj, objEnd = m_Module.obj_end();
+ for (obj = m_Module.obj_begin(); obj != objEnd; ++obj) {
+ std::set<const LDSection*> funcptr_access_set;  // sections excluded in safe mode (filled only when ICF mode is ICF_Safe)
+ typedef std::map<LDSection*, LDSection*> CandidateMap;  // TEXT section -> its relocation section (NULL when none was seen)
+ CandidateMap candidate_map;
+ LDContext::sect_iterator sect, sectEnd = (*obj)->context()->sectEnd();
+ for (sect = (*obj)->context()->sectBegin(); sect != sectEnd; ++sect) {
+ switch ((*sect)->kind()) {
+ case LDFileFormat::TEXT: {
+ candidate_map.insert(std::make_pair(*sect, (LDSection*)NULL));  // insert() leaves an already-present entry untouched
+ break;
+ }
+ case LDFileFormat::Relocation: {
+ LDSection* target = (*sect)->getLink();
+ if (target->kind() == LDFileFormat::TEXT) {
+ candidate_map[target] = *sect;
+ }
+ // Safe ICF: record the defining section of every function symbol whose
+ // relocation may be a function-pointer access.
+ if (m_Config.options().getICFMode() == GeneralOptions::ICF_Safe) {
+ RelocData::iterator rel, relEnd = (*sect)->getRelocData()->end();
+ for (rel = (*sect)->getRelocData()->begin(); rel != relEnd; ++rel) {
+ LDSymbol* sym = rel->symInfo()->outSymbol();
+ if (sym->hasFragRef() && (sym->type() == ResolveInfo::Function)) {
+ const LDSection* def =
+ &sym->fragRef()->frag()->getParent()->getSection();
+ if (!isSymCtorOrDtor(*rel->symInfo()) &&  // ctors/dtors are never added to the exclusion set
+ m_Backend.mayHaveUnsafeFunctionPointerAccess(*target) &&
+ m_Backend.
+ getRelocator()->mayHaveFunctionPointerAccess(*rel)) {
+ funcptr_access_set.insert(def);
+ }
+ }
+ } // end of loop over relocations
+ }
+ break;
+ }
+ default: {
+ // Other section kinds are ignored.
+ break;;
+ }
+ } // end of switch on section kind
+ } // end of loop over sections
+ CandidateMap::iterator candidate, candidateEnd = candidate_map.end();
+ for (candidate = candidate_map.begin(); candidate != candidateEnd;
+ ++candidate) {
+ if ((m_Config.options().getICFMode() == GeneralOptions::ICF_All) ||  // ICF_All accepts every TEXT section; otherwise only those not in funcptr_access_set
+ (funcptr_access_set.count(candidate->first) == 0)) {
+ size_t index = m_KeptSections.size();  // index assigned to the section is the map size before it is added
+ m_KeptSections[candidate->first] = ObjectAndId(*obj, index);
+ pCandidateList.push_back(FoldingCandidate(candidate->first,
+ candidate->second,
+ *obj));
+ }
+ } // end of loop over this object's candidates
+ } // end of loop over input objects
+bool IdenticalCodeFolding::matchCandidates(FoldingCandidates& pCandidateList)  // one matching round; returns true when no candidate had content identical to an earlier one
+ typedef std::multimap<uint32_t, size_t> ChecksumMap;  // checksum -> candidate index; an index is inserted only when its checksum is first seen
+ ChecksumMap checksum_map;
+ std::vector<std::string> contents(pCandidateList.size());
+ bool converged = true;
+ for (size_t index = 0; index < pCandidateList.size(); ++index) {
+ contents[index] = pCandidateList[index].
+ getContentWithVariables(m_Backend, m_KeptSections);
+ uint32_t checksum = ::crc32(0xFFFFFFFF,  // zlib crc32 over the candidate's full content, seeded with 0xFFFFFFFF
+ (const uint8_t*)contents[index].c_str(),
+ contents[index].length());
+ size_t count = checksum_map.count(checksum);
+ if (count == 0) {
+ checksum_map.insert(std::make_pair(checksum, index));
+ } else {
+ std::pair<ChecksumMap::iterator, ChecksumMap::iterator> ret =
+ checksum_map.equal_range(checksum);
+ for (ChecksumMap::iterator it = ret.first; it != ret.second; ++it) {
+ size_t kept_index = (*it).second;
+ if (contents[index].compare(contents[kept_index]) == 0) {  // equal checksums are confirmed by comparing the full strings
+ m_KeptSections[pCandidateList[index].sect].second = kept_index;  // record the earlier candidate as the kept one
+ converged = false;
+ break;
+ }
+ }
+ }
+ }
+ return converged;
+void IdenticalCodeFolding::FoldingCandidate::initConstantContent(  // fills `content` from section bytes and relocation data; relocations against other kept sections go to variable_relocs
+ const TargetLDBackend& pBackend,
+ const IdenticalCodeFolding::KeptSections& pKeptSections)
+ // Append the raw bytes of every region fragment in the text section.
+ assert(sect != NULL && sect->hasSectionData());
+ SectionData::const_iterator frag, fragEnd = sect->getSectionData()->end();
+ for (frag = sect->getSectionData()->begin(); frag != fragEnd; ++frag) {
+ switch (frag->getKind()) {
+ case Fragment::Region: {
+ const RegionFragment& region = llvm::cast<RegionFragment>(*frag);
+ content.append(region.getRegion().begin(), region.size());
+ break;
+ }
+ default: {
+ // FIXME: Only RegionFragment is handled; other fragment kinds add nothing.
+ break;
+ }
+ }
+ }
+ // Append the per-relocation data from the associated relocation section.
+ if (reloc_sect != NULL && reloc_sect->hasRelocData()) {
+ RelocData::iterator rel, relEnd = reloc_sect->getRelocData()->end();
+ for (rel = reloc_sect->getRelocData()->begin(); rel != relEnd; ++rel) {
+ llvm::format_object4<Relocation::Type, Relocation::Address,
+ Relocation::Address, Relocation::Address>
+ rel_info("%x%llx%llx%llx", rel->type(), rel->symValue(),  // hex of type, symbol value, addend and place, with no separators
+ rel->addend(), rel->place());
+ char rel_str[48];  // NOTE(review): confirm 48 bytes covers the longest output of the format above; print() is given sizeof(rel_str) as its limit
+ rel_info.print(rel_str, sizeof(rel_str));
+ content.append(rel_str);
+ // A relocation against a function defined in this same section (a
+ // recursive call) contributes nothing beyond the data appended above.
+ LDSymbol* sym = rel->symInfo()->outSymbol();
+ if ((sym->type() == ResolveInfo::Function) && sym->hasFragRef()) {
+ LDSection* def = &sym->fragRef()->frag()->getParent()->getSection();
+ if (def == sect) {
+ continue;
+ }
+ }
+ if (!pBackend.isSymbolPreemptible(*rel->symInfo()) &&  // non-preemptible symbol defined in a section present in pKeptSections
+ sym->hasFragRef() &&
+ (pKeptSections.find(
+ &sym->fragRef()->frag()->getParent()->getSection()) !=
+ pKeptSections.end())) {
+ // Defer this reloc: it is resolved per round in getContentWithVariables().
+ variable_relocs.push_back(rel);
+ } else {
+ // TODO: Support inlining merge sections if possible (target-dependent).
+ if ((sym->binding() == ResolveInfo::Local) ||
+ (sym->binding() == ResolveInfo::Absolute)) {
+ // Local or absolute symbol: append its name plus the object's name and path.
+ content.append(sym->name())
+ .append(obj->name())
+ .append(obj->path().native());
+ } else {
+ content.append(sym->name());  // any other binding: the symbol name alone is appended
+ }
+ }
+ }
+ }
+std::string IdenticalCodeFolding::FoldingCandidate::getContentWithVariables(  // returns `content` followed by one hex kept-index per entry of variable_relocs
+ const TargetLDBackend& pBackend,
+ const IdenticalCodeFolding::KeptSections& pKeptSections)
+ std::string result(content);
+ // Append the part that depends on the current state of pKeptSections.
+ std::vector<Relocation*>::const_iterator rel, relEnd = variable_relocs.end();
+ for (rel = variable_relocs.begin(); rel != relEnd; ++rel) {
+ LDSymbol* sym = (*rel)->symInfo()->outSymbol();
+ LDSection* def = &sym->fragRef()->frag()->getParent()->getSection();
+ // Look up the index currently recorded for the symbol's defining section.
+ KeptSections::const_iterator it = pKeptSections.find(def);  // NOTE(review): dereferenced below without an end() check; presumably always found because initConstantContent() only records relocs whose section is in the map
+ llvm::format_object1<size_t> kept_info("%x", (*it).second.second);  // NOTE(review): "%x" is paired with a size_t argument; confirm this is well-formed on 64-bit targets
+ char kept_str[8];  // NOTE(review): holds at most 7 characters plus terminator; confirm indices cannot need more hex digits
+ kept_info.print(kept_str, sizeof(kept_str));
+ result.append(kept_str);
+ }
+ return result;
diff --git a/lib/Support/ b/lib/Support/
index 36983ed..dfff7c9 100644
--- a/lib/Support/
+++ b/lib/Support/
@@ -2,6 +2,7 @@ LOCAL_PATH:= $(call my-dir)
mcld_support_SRC_FILES := \
CommandLine.cpp \
+ Demangle.cpp \
Directory.cpp \
FileHandle.cpp \
FileOutputBuffer.cpp \