LLVM  8.0.1
CrossDSOCFI.cpp
Go to the documentation of this file.
1 //===-- CrossDSOCFI.cpp - Externalize this module's CFI checks ------------===//
2 //
3 // The LLVM Compiler Infrastructure
4 //
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
7 //
8 //===----------------------------------------------------------------------===//
9 //
10 // This pass exports all llvm.bitset's found in the module in the form of a
11 // __cfi_check function, which can be used to verify cross-DSO call targets.
12 //
13 //===----------------------------------------------------------------------===//
14 
16 #include "llvm/ADT/SetVector.h"
17 #include "llvm/ADT/Statistic.h"
18 #include "llvm/ADT/Triple.h"
19 #include "llvm/IR/Constant.h"
20 #include "llvm/IR/Constants.h"
21 #include "llvm/IR/Function.h"
22 #include "llvm/IR/GlobalObject.h"
23 #include "llvm/IR/GlobalVariable.h"
24 #include "llvm/IR/IRBuilder.h"
25 #include "llvm/IR/Instructions.h"
26 #include "llvm/IR/Intrinsics.h"
27 #include "llvm/IR/MDBuilder.h"
28 #include "llvm/IR/Module.h"
29 #include "llvm/IR/Operator.h"
30 #include "llvm/Pass.h"
31 #include "llvm/Support/Debug.h"
33 #include "llvm/Transforms/IPO.h"
34 
35 using namespace llvm;
36 
37 #define DEBUG_TYPE "cross-dso-cfi"
38 
39 STATISTIC(NumTypeIds, "Number of unique type identifiers");
40 
41 namespace {
42 
43 struct CrossDSOCFI : public ModulePass {
44  static char ID;
45  CrossDSOCFI() : ModulePass(ID) {
47  }
48 
49  MDNode *VeryLikelyWeights;
50 
51  ConstantInt *extractNumericTypeId(MDNode *MD);
52  void buildCFICheck(Module &M);
53  bool runOnModule(Module &M) override;
54 };
55 
56 } // anonymous namespace
57 
58 INITIALIZE_PASS_BEGIN(CrossDSOCFI, "cross-dso-cfi", "Cross-DSO CFI", false,
59  false)
60 INITIALIZE_PASS_END(CrossDSOCFI, "cross-dso-cfi", "Cross-DSO CFI", false, false)
61 char CrossDSOCFI::ID = 0;
62 
63 ModulePass *llvm::createCrossDSOCFIPass() { return new CrossDSOCFI; }
64 
65 /// Extracts a numeric type identifier from an MDNode containing type metadata.
66 ConstantInt *CrossDSOCFI::extractNumericTypeId(MDNode *MD) {
67  // This check excludes vtables for classes inside anonymous namespaces.
68  auto TM = dyn_cast<ValueAsMetadata>(MD->getOperand(1));
69  if (!TM)
70  return nullptr;
71  auto C = dyn_cast_or_null<ConstantInt>(TM->getValue());
72  if (!C) return nullptr;
73  // We are looking for i64 constants.
74  if (C->getBitWidth() != 64) return nullptr;
75 
76  return C;
77 }
78 
79 /// buildCFICheck - emits __cfi_check for the current module.
80 void CrossDSOCFI::buildCFICheck(Module &M) {
81  // FIXME: verify that __cfi_check ends up near the end of the code section,
82  // but before the jump slots created in LowerTypeTests.
83  SetVector<uint64_t> TypeIds;
85  for (GlobalObject &GO : M.global_objects()) {
86  Types.clear();
87  GO.getMetadata(LLVMContext::MD_type, Types);
88  for (MDNode *Type : Types) {
89  // Sanity check. GO must not be a function declaration.
90  assert(!isa<Function>(&GO) || !cast<Function>(&GO)->isDeclaration());
91 
92  if (ConstantInt *TypeId = extractNumericTypeId(Type))
93  TypeIds.insert(TypeId->getZExtValue());
94  }
95  }
96 
97  NamedMDNode *CfiFunctionsMD = M.getNamedMetadata("cfi.functions");
98  if (CfiFunctionsMD) {
99  for (auto Func : CfiFunctionsMD->operands()) {
100  assert(Func->getNumOperands() >= 2);
101  for (unsigned I = 2; I < Func->getNumOperands(); ++I)
102  if (ConstantInt *TypeId =
103  extractNumericTypeId(cast<MDNode>(Func->getOperand(I).get())))
104  TypeIds.insert(TypeId->getZExtValue());
105  }
106  }
107 
108  LLVMContext &Ctx = M.getContext();
110  "__cfi_check", Type::getVoidTy(Ctx), Type::getInt64Ty(Ctx),
113  // Take over the existing function. The frontend emits a weak stub so that the
114  // linker knows about the symbol; this pass replaces the function body.
115  F->deleteBody();
116  F->setAlignment(4096);
117 
118  Triple T(M.getTargetTriple());
119  if (T.isARM() || T.isThumb())
120  F->addFnAttr("target-features", "+thumb-mode");
121 
122  auto args = F->arg_begin();
123  Value &CallSiteTypeId = *(args++);
124  CallSiteTypeId.setName("CallSiteTypeId");
125  Value &Addr = *(args++);
126  Addr.setName("Addr");
127  Value &CFICheckFailData = *(args++);
128  CFICheckFailData.setName("CFICheckFailData");
129  assert(args == F->arg_end());
130 
131  BasicBlock *BB = BasicBlock::Create(Ctx, "entry", F);
132  BasicBlock *ExitBB = BasicBlock::Create(Ctx, "exit", F);
133 
134  BasicBlock *TrapBB = BasicBlock::Create(Ctx, "fail", F);
135  IRBuilder<> IRBFail(TrapBB);
136  Constant *CFICheckFailFn = M.getOrInsertFunction(
137  "__cfi_check_fail", Type::getVoidTy(Ctx), Type::getInt8PtrTy(Ctx),
138  Type::getInt8PtrTy(Ctx));
139  IRBFail.CreateCall(CFICheckFailFn, {&CFICheckFailData, &Addr});
140  IRBFail.CreateBr(ExitBB);
141 
142  IRBuilder<> IRBExit(ExitBB);
143  IRBExit.CreateRetVoid();
144 
145  IRBuilder<> IRB(BB);
146  SwitchInst *SI = IRB.CreateSwitch(&CallSiteTypeId, TrapBB, TypeIds.size());
147  for (uint64_t TypeId : TypeIds) {
148  ConstantInt *CaseTypeId = ConstantInt::get(Type::getInt64Ty(Ctx), TypeId);
149  BasicBlock *TestBB = BasicBlock::Create(Ctx, "test", F);
150  IRBuilder<> IRBTest(TestBB);
152 
153  Value *Test = IRBTest.CreateCall(
154  BitsetTestFn, {&Addr, MetadataAsValue::get(
155  Ctx, ConstantAsMetadata::get(CaseTypeId))});
156  BranchInst *BI = IRBTest.CreateCondBr(Test, ExitBB, TrapBB);
157  BI->setMetadata(LLVMContext::MD_prof, VeryLikelyWeights);
158 
159  SI->addCase(CaseTypeId, TestBB);
160  ++NumTypeIds;
161  }
162 }
163 
164 bool CrossDSOCFI::runOnModule(Module &M) {
165  VeryLikelyWeights =
166  MDBuilder(M.getContext()).createBranchWeights((1U << 20) - 1, 1);
167  if (M.getModuleFlag("Cross-DSO CFI") == nullptr)
168  return false;
169  buildCFICheck(M);
170  return true;
171 }
172 
174  CrossDSOCFI Impl;
175  bool Changed = Impl.runOnModule(M);
176  if (!Changed)
177  return PreservedAnalyses::all();
178  return PreservedAnalyses::none();
179 }
uint64_t CallInst * C
PreservedAnalyses run(Module &M, ModuleAnalysisManager &AM)
const std::string & getTargetTriple() const
Get the target triple which is a string describing the target host.
Definition: Module.h:240
static PassRegistry * getPassRegistry()
getPassRegistry - Access the global registry object, which is automatically initialized at applicatio...
This class represents lattice values for constants.
Definition: AllocatorList.h:24
size_type size() const
Determine the number of elements in the SetVector.
Definition: SetVector.h:78
Constant * getOrInsertFunction(StringRef Name, FunctionType *T, AttributeList AttributeList)
Look up the specified function in the module symbol table.
Definition: Module.cpp:144
A Module instance is used to store all the information related to an LLVM module. ...
Definition: Module.h:65
void addCase(ConstantInt *OnVal, BasicBlock *Dest)
Add an entry to the switch instruction.
arg_iterator arg_end()
Definition: Function.h:680
STATISTIC(NumFunctions, "Total number of functions")
Metadata node.
Definition: Metadata.h:864
F(f)
const MDOperand & getOperand(unsigned I) const
Definition: Metadata.h:1069
static IntegerType * getInt64Ty(LLVMContext &C)
Definition: Type.cpp:177
void setAlignment(unsigned Align)
Definition: Globals.cpp:116
iterator_range< global_object_iterator > global_objects()
Definition: Module.h:659
A tuple of MDNodes.
Definition: Metadata.h:1326
LLVMContext & getContext() const
Get the global data context.
Definition: Module.h:244
ModulePass * createCrossDSOCFIPass()
This pass export CFI checks for use by external modules.
This provides a uniform API for creating instructions and inserting them into a basic block: either a...
Definition: IRBuilder.h:743
void setName(const Twine &Name)
Change the name of the value.
Definition: Value.cpp:285
bool insert(const value_type &X)
Insert a new element into the SetVector.
Definition: SetVector.h:142
void initializeCrossDSOCFIPass(PassRegistry &)
#define T
NamedMDNode * getNamedMetadata(const Twine &Name) const
Return the first NamedMDNode in the module with the specified name.
Definition: Module.cpp:252
Value wrapper in the Metadata hierarchy.
Definition: Metadata.h:339
static ConstantAsMetadata * get(Constant *C)
Definition: Metadata.h:410
iterator_range< op_iterator > operands()
Definition: Metadata.h:1418
Function * getDeclaration(Module *M, ID id, ArrayRef< Type *> Tys=None)
Create or insert an LLVM Function declaration for an intrinsic, and return it.
Definition: Function.cpp:1020
static PreservedAnalyses none()
Convenience factory function for the empty preserved set.
Definition: PassManager.h:157
static MetadataAsValue * get(LLVMContext &Context, Metadata *MD)
Definition: Metadata.cpp:106
A set of analyses that are preserved following a run of a transformation pass.
Definition: PassManager.h:154
LLVM Basic Block Representation.
Definition: BasicBlock.h:58
The instances of the Type class are immutable: once they are created, they are never changed...
Definition: Type.h:46
This is an important class for using LLVM in a threaded context.
Definition: LLVMContext.h:69
Conditional or Unconditional Branch instruction.
Metadata * getModuleFlag(StringRef Key) const
Return the corresponding value if Key appears in module flags, otherwise return null.
Definition: Module.cpp:312
void deleteBody()
deleteBody - This method deletes the body of the function, and converts the linkage to external...
Definition: Function.h:609
This is an important base class in LLVM.
Definition: Constant.h:42
This file contains the declarations for the subclasses of Constant, which represent the different fla...
static Type * getVoidTy(LLVMContext &C)
Definition: Type.cpp:161
static BasicBlock * Create(LLVMContext &Context, const Twine &Name="", Function *Parent=nullptr, BasicBlock *InsertBefore=nullptr)
Creates a new BasicBlock.
Definition: BasicBlock.h:100
arg_iterator arg_begin()
Definition: Function.h:671
static PreservedAnalyses all()
Construct a special preserved set that preserves all passes.
Definition: PassManager.h:160
static PointerType * getInt8PtrTy(LLVMContext &C, unsigned AS=0)
Definition: Type.cpp:220
INITIALIZE_PASS_END(RegBankSelect, DEBUG_TYPE, "Assign register bank of generic virtual registers", false, false) RegBankSelect
void setMetadata(unsigned KindID, MDNode *Node)
Set the metadata of the specified kind to the specified node.
Definition: Metadata.cpp:1226
Triple - Helper class for working with autoconf configuration names.
Definition: Triple.h:44
This is the shared class of boolean and integer constants.
Definition: Constants.h:84
This is a &#39;vector&#39; (really, a variable-sized array), optimized for the case when the array is small...
Definition: SmallVector.h:847
Module.h This file contains the declarations for the Module class.
#define INITIALIZE_PASS_BEGIN(passName, arg, name, cfg, analysis)
Definition: PassSupport.h:48
static Constant * get(Type *Ty, uint64_t V, bool isSigned=false)
If Ty is a vector type, return a Constant with a splat of the given value.
Definition: Constants.cpp:622
#define I(x, y, z)
Definition: MD5.cpp:58
ModulePass class - This class is used to implement unstructured interprocedural optimizations and ana...
Definition: Pass.h:225
LLVM_NODISCARD std::enable_if<!is_simple_type< Y >::value, typename cast_retty< X, const Y >::ret_type >::type dyn_cast(const Y &Val)
Definition: Casting.h:323
Multiway switch.
assert(ImpDefSCC.getReg()==AMDGPU::SCC &&ImpDefSCC.isDef())
LLVM Value Representation.
Definition: Value.h:73
A vector that has set insertion semantics.
Definition: SetVector.h:41
void addFnAttr(Attribute::AttrKind Kind)
Add function attributes to this function.
Definition: Function.h:230
A container for analyses that lazily runs them and caches their results.