blob: 69d0bca0bd77201966ffb8132eaaa4404f55b2f3 [file] [log] [blame]
//===---------------- BPFAdjustOpt.cpp - Adjust Optimization --------------===//
//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//
//
// Adjust optimization to make the code more kernel verifier friendly.
//
//===----------------------------------------------------------------------===//
#include "BPF.h"
#include "BPFCORE.h"
#include "BPFTargetMachine.h"
#include "llvm/IR/Instruction.h"
#include "llvm/IR/Instructions.h"
#include "llvm/IR/IntrinsicsBPF.h"
#include "llvm/IR/Module.h"
#include "llvm/IR/PatternMatch.h"
#include "llvm/IR/Type.h"
#include "llvm/IR/User.h"
#include "llvm/IR/Value.h"
#include "llvm/Pass.h"
#include "llvm/Transforms/Utils/BasicBlockUtils.h"
#define DEBUG_TYPE "bpf-adjust-opt"
using namespace llvm;
using namespace llvm::PatternMatch;
static cl::opt<bool>
DisableBPFserializeICMP("bpf-disable-serialize-icmp", cl::Hidden,
cl::desc("BPF: Disable Serializing ICMP insns."),
cl::init(false));
static cl::opt<bool> DisableBPFavoidSpeculation(
"bpf-disable-avoid-speculation", cl::Hidden,
cl::desc("BPF: Disable Avoiding Speculative Code Motion."),
cl::init(false));
namespace {
class BPFAdjustOpt final : public ModulePass {
public:
static char ID;
BPFAdjustOpt() : ModulePass(ID) {}
bool runOnModule(Module &M) override;
};
class BPFAdjustOptImpl {
struct PassThroughInfo {
Instruction *Input;
Instruction *UsedInst;
uint32_t OpIdx;
PassThroughInfo(Instruction *I, Instruction *U, uint32_t Idx)
: Input(I), UsedInst(U), OpIdx(Idx) {}
};
public:
BPFAdjustOptImpl(Module *M) : M(M) {}
bool run();
private:
Module *M;
SmallVector<PassThroughInfo, 16> PassThroughs;
bool adjustICmpToBuiltin();
void adjustBasicBlock(BasicBlock &BB);
bool serializeICMPCrossBB(BasicBlock &BB);
void adjustInst(Instruction &I);
bool serializeICMPInBB(Instruction &I);
bool avoidSpeculation(Instruction &I);
bool insertPassThrough();
};
} // End anonymous namespace
char BPFAdjustOpt::ID = 0;
INITIALIZE_PASS(BPFAdjustOpt, "bpf-adjust-opt", "BPF Adjust Optimization",
false, false)
ModulePass *llvm::createBPFAdjustOpt() { return new BPFAdjustOpt(); }
bool BPFAdjustOpt::runOnModule(Module &M) { return BPFAdjustOptImpl(&M).run(); }
bool BPFAdjustOptImpl::run() {
bool Changed = adjustICmpToBuiltin();
for (Function &F : *M)
for (auto &BB : F) {
adjustBasicBlock(BB);
for (auto &I : BB)
adjustInst(I);
}
return insertPassThrough() || Changed;
}
// Commit acabad9ff6bf ("[InstCombine] try to canonicalize icmp with
// trunc op into mask and cmp") added a transformation to
// convert "(conv)a < power_2_const" to "a & <const>" in certain
// cases and bpf kernel verifier has to handle the resulted code
// conservatively and this may reject otherwise legitimate program.
// Here, we change related icmp code to a builtin which will
// be restored to original icmp code later to prevent that
// InstCombine transformatin.
bool BPFAdjustOptImpl::adjustICmpToBuiltin() {
bool Changed = false;
ICmpInst *ToBeDeleted = nullptr;
for (Function &F : *M)
for (auto &BB : F)
for (auto &I : BB) {
if (ToBeDeleted) {
ToBeDeleted->eraseFromParent();
ToBeDeleted = nullptr;
}
auto *Icmp = dyn_cast<ICmpInst>(&I);
if (!Icmp)
continue;
Value *Op0 = Icmp->getOperand(0);
if (!isa<TruncInst>(Op0))
continue;
auto ConstOp1 = dyn_cast<ConstantInt>(Icmp->getOperand(1));
if (!ConstOp1)
continue;
auto ConstOp1Val = ConstOp1->getValue().getZExtValue();
auto Op = Icmp->getPredicate();
if (Op == ICmpInst::ICMP_ULT || Op == ICmpInst::ICMP_UGE) {
if ((ConstOp1Val - 1) & ConstOp1Val)
continue;
} else if (Op == ICmpInst::ICMP_ULE || Op == ICmpInst::ICMP_UGT) {
if (ConstOp1Val & (ConstOp1Val + 1))
continue;
} else {
continue;
}
Constant *Opcode =
ConstantInt::get(Type::getInt32Ty(BB.getContext()), Op);
Function *Fn = Intrinsic::getDeclaration(
M, Intrinsic::bpf_compare, {Op0->getType(), ConstOp1->getType()});
auto *NewInst = CallInst::Create(Fn, {Opcode, Op0, ConstOp1});
BB.getInstList().insert(I.getIterator(), NewInst);
Icmp->replaceAllUsesWith(NewInst);
Changed = true;
ToBeDeleted = Icmp;
}
return Changed;
}
bool BPFAdjustOptImpl::insertPassThrough() {
for (auto &Info : PassThroughs) {
auto *CI = BPFCoreSharedInfo::insertPassThrough(
M, Info.UsedInst->getParent(), Info.Input, Info.UsedInst);
Info.UsedInst->setOperand(Info.OpIdx, CI);
}
return !PassThroughs.empty();
}
// To avoid combining conditionals in the same basic block by
// instrcombine optimization.
bool BPFAdjustOptImpl::serializeICMPInBB(Instruction &I) {
// For:
// comp1 = icmp <opcode> ...;
// comp2 = icmp <opcode> ...;
// ... or comp1 comp2 ...
// changed to:
// comp1 = icmp <opcode> ...;
// comp2 = icmp <opcode> ...;
// new_comp1 = __builtin_bpf_passthrough(seq_num, comp1)
// ... or new_comp1 comp2 ...
Value *Op0, *Op1;
// Use LogicalOr (accept `or i1` as well as `select i1 Op0, true, Op1`)
if (!match(&I, m_LogicalOr(m_Value(Op0), m_Value(Op1))))
return false;
auto *Icmp1 = dyn_cast<ICmpInst>(Op0);
if (!Icmp1)
return false;
auto *Icmp2 = dyn_cast<ICmpInst>(Op1);
if (!Icmp2)
return false;
Value *Icmp1Op0 = Icmp1->getOperand(0);
Value *Icmp2Op0 = Icmp2->getOperand(0);
if (Icmp1Op0 != Icmp2Op0)
return false;
// Now we got two icmp instructions which feed into
// an "or" instruction.
PassThroughInfo Info(Icmp1, &I, 0);
PassThroughs.push_back(Info);
return true;
}
// To avoid combining conditionals in the same basic block by
// instrcombine optimization.
bool BPFAdjustOptImpl::serializeICMPCrossBB(BasicBlock &BB) {
// For:
// B1:
// comp1 = icmp <opcode> ...;
// if (comp1) goto B2 else B3;
// B2:
// comp2 = icmp <opcode> ...;
// if (comp2) goto B4 else B5;
// B4:
// ...
// changed to:
// B1:
// comp1 = icmp <opcode> ...;
// comp1 = __builtin_bpf_passthrough(seq_num, comp1);
// if (comp1) goto B2 else B3;
// B2:
// comp2 = icmp <opcode> ...;
// if (comp2) goto B4 else B5;
// B4:
// ...
// Check basic predecessors, if two of them (say B1, B2) are using
// icmp instructions to generate conditions and one is the predesessor
// of another (e.g., B1 is the predecessor of B2). Add a passthrough
// barrier after icmp inst of block B1.
BasicBlock *B2 = BB.getSinglePredecessor();
if (!B2)
return false;
BasicBlock *B1 = B2->getSinglePredecessor();
if (!B1)
return false;
Instruction *TI = B2->getTerminator();
auto *BI = dyn_cast<BranchInst>(TI);
if (!BI || !BI->isConditional())
return false;
auto *Cond = dyn_cast<ICmpInst>(BI->getCondition());
if (!Cond || B2->getFirstNonPHI() != Cond)
return false;
Value *B2Op0 = Cond->getOperand(0);
auto Cond2Op = Cond->getPredicate();
TI = B1->getTerminator();
BI = dyn_cast<BranchInst>(TI);
if (!BI || !BI->isConditional())
return false;
Cond = dyn_cast<ICmpInst>(BI->getCondition());
if (!Cond)
return false;
Value *B1Op0 = Cond->getOperand(0);
auto Cond1Op = Cond->getPredicate();
if (B1Op0 != B2Op0)
return false;
if (Cond1Op == ICmpInst::ICMP_SGT || Cond1Op == ICmpInst::ICMP_SGE) {
if (Cond2Op != ICmpInst::ICMP_SLT && Cond1Op != ICmpInst::ICMP_SLE)
return false;
} else if (Cond1Op == ICmpInst::ICMP_SLT || Cond1Op == ICmpInst::ICMP_SLE) {
if (Cond2Op != ICmpInst::ICMP_SGT && Cond1Op != ICmpInst::ICMP_SGE)
return false;
} else {
return false;
}
PassThroughInfo Info(Cond, BI, 0);
PassThroughs.push_back(Info);
return true;
}
// To avoid speculative hoisting certain computations out of
// a basic block.
bool BPFAdjustOptImpl::avoidSpeculation(Instruction &I) {
if (auto *LdInst = dyn_cast<LoadInst>(&I)) {
if (auto *GV = dyn_cast<GlobalVariable>(LdInst->getOperand(0))) {
if (GV->hasAttribute(BPFCoreSharedInfo::AmaAttr) ||
GV->hasAttribute(BPFCoreSharedInfo::TypeIdAttr))
return false;
}
}
if (!isa<LoadInst>(&I) && !isa<CallInst>(&I))
return false;
// For:
// B1:
// var = ...
// ...
// /* icmp may not be in the same block as var = ... */
// comp1 = icmp <opcode> var, <const>;
// if (comp1) goto B2 else B3;
// B2:
// ... var ...
// change to:
// B1:
// var = ...
// ...
// /* icmp may not be in the same block as var = ... */
// comp1 = icmp <opcode> var, <const>;
// if (comp1) goto B2 else B3;
// B2:
// var = __builtin_bpf_passthrough(seq_num, var);
// ... var ...
bool isCandidate = false;
SmallVector<PassThroughInfo, 4> Candidates;
for (User *U : I.users()) {
Instruction *Inst = dyn_cast<Instruction>(U);
if (!Inst)
continue;
// May cover a little bit more than the
// above pattern.
if (auto *Icmp1 = dyn_cast<ICmpInst>(Inst)) {
Value *Icmp1Op1 = Icmp1->getOperand(1);
if (!isa<Constant>(Icmp1Op1))
return false;
isCandidate = true;
continue;
}
// Ignore the use in the same basic block as the definition.
if (Inst->getParent() == I.getParent())
continue;
// use in a different basic block, If there is a call or
// load/store insn before this instruction in this basic
// block. Most likely it cannot be hoisted out. Skip it.
for (auto &I2 : *Inst->getParent()) {
if (isa<CallInst>(&I2))
return false;
if (isa<LoadInst>(&I2) || isa<StoreInst>(&I2))
return false;
if (&I2 == Inst)
break;
}
// It should be used in a GEP or a simple arithmetic like
// ZEXT/SEXT which is used for GEP.
if (Inst->getOpcode() == Instruction::ZExt ||
Inst->getOpcode() == Instruction::SExt) {
PassThroughInfo Info(&I, Inst, 0);
Candidates.push_back(Info);
} else if (auto *GI = dyn_cast<GetElementPtrInst>(Inst)) {
// traverse GEP inst to find Use operand index
unsigned i, e;
for (i = 1, e = GI->getNumOperands(); i != e; ++i) {
Value *V = GI->getOperand(i);
if (V == &I)
break;
}
if (i == e)
continue;
PassThroughInfo Info(&I, GI, i);
Candidates.push_back(Info);
}
}
if (!isCandidate || Candidates.empty())
return false;
llvm::append_range(PassThroughs, Candidates);
return true;
}
void BPFAdjustOptImpl::adjustBasicBlock(BasicBlock &BB) {
if (!DisableBPFserializeICMP && serializeICMPCrossBB(BB))
return;
}
void BPFAdjustOptImpl::adjustInst(Instruction &I) {
if (!DisableBPFserializeICMP && serializeICMPInBB(I))
return;
if (!DisableBPFavoidSpeculation && avoidSpeculation(I))
return;
}
PreservedAnalyses BPFAdjustOptPass::run(Module &M, ModuleAnalysisManager &AM) {
return BPFAdjustOptImpl(&M).run() ? PreservedAnalyses::none()
: PreservedAnalyses::all();
}