Add --bp-compression-sort-section=<glob>[=<layout_priority>[=<match_priority>]] to let users split input sections into multiple compression groups, run balanced partitioning independently per group, and leave out sections that are poor candidates for BP. This replaces the old coarse --bp-compression-sort with a more explicit, user-controlled one. In ELF, the glob matches input section names (.text.unlikely.cold1). In Mach-O, it matches the concatenated segment+section name (__TEXT__text). layout_priority controls group placement in the final layout. match_priority resolves conflicts when multiple globs match the same section: explicit priority beats positional matching, and among positional specs the last match wins. A CRTP hook getCompressionSubgroupKey() allows backends to further subdivide glob groups into independent BP instances. This allows Mach-O backend to separate cold functions via N_COLD_FUNC in the future. The deprecated --bp-compression-sort option keeps its existing function/data behavior by assigning sections to fixed legacy groups.
103 lines
3.8 KiB
C++
103 lines
3.8 KiB
C++
//===- BPSectionOrderer.cpp -----------------------------------------------===//
|
|
//
|
|
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
|
|
// See https://llvm.org/LICENSE.txt for license information.
|
|
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
#include "BPSectionOrderer.h"
|
|
#include "InputFiles.h"
|
|
#include "InputSection.h"
|
|
#include "SymbolTable.h"
|
|
#include "Symbols.h"
|
|
#include "lld/Common/BPSectionOrdererBase.inc"
|
|
#include "llvm/Support/Endian.h"
|
|
|
|
using namespace llvm;
|
|
using namespace lld::elf;
|
|
|
|
namespace {
|
|
struct BPOrdererELF;
|
|
}
|
|
template <> struct lld::BPOrdererTraits<struct BPOrdererELF> {
|
|
using Section = elf::InputSectionBase;
|
|
using Defined = elf::Defined;
|
|
};
|
|
namespace {
|
|
struct BPOrdererELF : lld::BPOrderer<BPOrdererELF> {
|
|
DenseMap<const InputSectionBase *, Defined *> secToSym;
|
|
|
|
static uint64_t getSize(const Section &sec) { return sec.getSize(); }
|
|
static bool isCodeSection(const Section &sec) {
|
|
return sec.flags & ELF::SHF_EXECINSTR;
|
|
}
|
|
static StringRef getSectionName(const Section &sec) { return sec.name; }
|
|
ArrayRef<Defined *> getSymbols(const Section &sec) {
|
|
auto it = secToSym.find(&sec);
|
|
if (it == secToSym.end())
|
|
return {};
|
|
return ArrayRef(it->second);
|
|
}
|
|
|
|
static void
|
|
getSectionHashes(const Section &sec, SmallVectorImpl<uint64_t> &hashes,
|
|
const DenseMap<const void *, uint64_t> §ionToIdx) {
|
|
constexpr unsigned windowSize = 4;
|
|
|
|
// Calculate content hashes: k-mers and the last k-1 bytes.
|
|
ArrayRef<uint8_t> data = sec.content();
|
|
if (data.size() >= windowSize)
|
|
for (size_t i = 0; i <= data.size() - windowSize; ++i)
|
|
hashes.push_back(support::endian::read32le(data.data() + i));
|
|
for (uint8_t byte : data.take_back(windowSize - 1))
|
|
hashes.push_back(byte);
|
|
|
|
llvm::sort(hashes);
|
|
hashes.erase(llvm::unique(hashes), hashes.end());
|
|
}
|
|
|
|
static StringRef getSymName(const Defined &sym) { return sym.getName(); }
|
|
static uint64_t getSymValue(const Defined &sym) { return sym.value; }
|
|
static uint64_t getSymSize(const Defined &sym) { return sym.size; }
|
|
};
|
|
} // namespace
|
|
|
|
DenseMap<const InputSectionBase *, int> elf::runBalancedPartitioning(
|
|
Ctx &ctx, StringRef profilePath,
|
|
ArrayRef<BPCompressionSortSpec> compressionSortSpecs,
|
|
bool forFunctionCompression, bool forDataCompression,
|
|
bool compressionSortStartupFunctions, bool verbose) {
|
|
// Collect candidate sections and associated symbols.
|
|
SmallVector<InputSectionBase *> sections;
|
|
DenseMap<CachedHashStringRef, std::set<unsigned>> rootSymbolToSectionIdxs;
|
|
BPOrdererELF orderer;
|
|
|
|
auto addSection = [&](Symbol &sym) {
|
|
auto *d = dyn_cast<Defined>(&sym);
|
|
if (!d)
|
|
return;
|
|
auto *sec = dyn_cast_or_null<InputSection>(d->section);
|
|
// Skip section symbols. Skip empty, discarded, ICF folded sections, .bss.
|
|
// ICF folded sections are already dead (!isLive()), so no separate check
|
|
// is needed.
|
|
if (sym.isSection() || !sec || sec->size == 0 || !sec->isLive() ||
|
|
!sec->content().data() || !orderer.secToSym.try_emplace(sec, d).second)
|
|
return;
|
|
rootSymbolToSectionIdxs[CachedHashStringRef(
|
|
lld::utils::getRootSymbol(sym.getName()))]
|
|
.insert(sections.size());
|
|
sections.emplace_back(sec);
|
|
};
|
|
|
|
for (Symbol *sym : ctx.symtab->getSymbols())
|
|
addSection(*sym);
|
|
for (ELFFileBase *file : ctx.objectFiles)
|
|
for (Symbol *sym : file->getLocalSymbols())
|
|
addSection(*sym);
|
|
return orderer.computeOrder(profilePath, compressionSortSpecs,
|
|
forFunctionCompression, forDataCompression,
|
|
compressionSortStartupFunctions, verbose,
|
|
sections, rootSymbolToSectionIdxs);
|
|
}
|