diff options
| author | Dimitry Andric <dim@FreeBSD.org> | 2017-04-16 16:01:22 +0000 | 
|---|---|---|
| committer | Dimitry Andric <dim@FreeBSD.org> | 2017-04-16 16:01:22 +0000 | 
| commit | 71d5a2540a98c81f5bcaeb48805e0e2881f530ef (patch) | |
| tree | 5343938942df402b49ec7300a1c25a2d4ccd5821 /lib/Transforms/Instrumentation | |
| parent | 31bbf64f3a4974a2d6c8b3b27ad2f519caf74057 (diff) | |
Diffstat (limited to 'lib/Transforms/Instrumentation')
| -rw-r--r-- | lib/Transforms/Instrumentation/AddressSanitizer.cpp | 156 | ||||
| -rw-r--r-- | lib/Transforms/Instrumentation/DataFlowSanitizer.cpp | 78 | ||||
| -rw-r--r-- | lib/Transforms/Instrumentation/EfficiencySanitizer.cpp | 22 | ||||
| -rw-r--r-- | lib/Transforms/Instrumentation/IndirectCallPromotion.cpp | 506 | ||||
| -rw-r--r-- | lib/Transforms/Instrumentation/InstrProfiling.cpp | 170 | ||||
| -rw-r--r-- | lib/Transforms/Instrumentation/Instrumentation.cpp | 1 | ||||
| -rw-r--r-- | lib/Transforms/Instrumentation/MemorySanitizer.cpp | 103 | ||||
| -rw-r--r-- | lib/Transforms/Instrumentation/PGOInstrumentation.cpp | 353 | ||||
| -rw-r--r-- | lib/Transforms/Instrumentation/SanitizerCoverage.cpp | 100 | ||||
| -rw-r--r-- | lib/Transforms/Instrumentation/ThreadSanitizer.cpp | 54 | 
10 files changed, 1151 insertions, 392 deletions
| diff --git a/lib/Transforms/Instrumentation/AddressSanitizer.cpp b/lib/Transforms/Instrumentation/AddressSanitizer.cpp index f5e9e7dd5a93..94cfc69ed555 100644 --- a/lib/Transforms/Instrumentation/AddressSanitizer.cpp +++ b/lib/Transforms/Instrumentation/AddressSanitizer.cpp @@ -80,6 +80,7 @@ static const uint64_t kMIPS64_ShadowOffset64 = 1ULL << 37;  static const uint64_t kAArch64_ShadowOffset64 = 1ULL << 36;  static const uint64_t kFreeBSD_ShadowOffset32 = 1ULL << 30;  static const uint64_t kFreeBSD_ShadowOffset64 = 1ULL << 46; +static const uint64_t kPS4CPU_ShadowOffset64 = 1ULL << 40;  static const uint64_t kWindowsShadowOffset32 = 3ULL << 28;  // The shadow memory space is dynamically allocated.  static const uint64_t kWindowsShadowOffset64 = kDynamicShadowSentinel; @@ -380,6 +381,7 @@ static ShadowMapping getShadowMapping(Triple &TargetTriple, int LongSize,    bool IsAndroid = TargetTriple.isAndroid();    bool IsIOS = TargetTriple.isiOS() || TargetTriple.isWatchOS();    bool IsFreeBSD = TargetTriple.isOSFreeBSD(); +  bool IsPS4CPU = TargetTriple.isPS4CPU();    bool IsLinux = TargetTriple.isOSLinux();    bool IsPPC64 = TargetTriple.getArch() == llvm::Triple::ppc64 ||                   TargetTriple.getArch() == llvm::Triple::ppc64le; @@ -392,6 +394,7 @@ static ShadowMapping getShadowMapping(Triple &TargetTriple, int LongSize,                    TargetTriple.getArch() == llvm::Triple::mips64el;    bool IsAArch64 = TargetTriple.getArch() == llvm::Triple::aarch64;    bool IsWindows = TargetTriple.isOSWindows(); +  bool IsFuchsia = TargetTriple.isOSFuchsia();    ShadowMapping Mapping; @@ -412,12 +415,18 @@ static ShadowMapping getShadowMapping(Triple &TargetTriple, int LongSize,      else        Mapping.Offset = kDefaultShadowOffset32;    } else {  // LongSize == 64 -    if (IsPPC64) +    // Fuchsia is always PIE, which means that the beginning of the address +    // space is always available. +    if (IsFuchsia) +      Mapping.Offset = 0; +    else if (IsPPC64)        Mapping.Offset = kPPC64_ShadowOffset64;      else if (IsSystemZ)        Mapping.Offset = kSystemZ_ShadowOffset64;      else if (IsFreeBSD)        Mapping.Offset = kFreeBSD_ShadowOffset64; +    else if (IsPS4CPU) +      Mapping.Offset = kPS4CPU_ShadowOffset64;      else if (IsLinux && IsX86_64) {        if (IsKasan)          Mapping.Offset = kLinuxKasan_ShadowOffset64; @@ -456,9 +465,9 @@ static ShadowMapping getShadowMapping(Triple &TargetTriple, int LongSize,    // offset is not necessary 1/8-th of the address space.  On SystemZ,    // we could OR the constant in a single instruction, but it's more    // efficient to load it once and use indexed addressing. -  Mapping.OrShadowOffset = !IsAArch64 && !IsPPC64 && !IsSystemZ -                           && !(Mapping.Offset & (Mapping.Offset - 1)) -                           && Mapping.Offset != kDynamicShadowSentinel; +  Mapping.OrShadowOffset = !IsAArch64 && !IsPPC64 && !IsSystemZ && !IsPS4CPU && +                           !(Mapping.Offset & (Mapping.Offset - 1)) && +                           Mapping.Offset != kDynamicShadowSentinel;    return Mapping;  } @@ -567,8 +576,6 @@ struct AddressSanitizer : public FunctionPass {    Type *IntptrTy;    ShadowMapping Mapping;    DominatorTree *DT; -  Function *AsanCtorFunction = nullptr; -  Function *AsanInitFunction = nullptr;    Function *AsanHandleNoReturnFunc;    Function *AsanPtrCmpFunction, *AsanPtrSubFunction;    // This array is indexed by AccessIsWrite, Experiment and log2(AccessSize). @@ -1561,31 +1568,31 @@ void AddressSanitizerModule::initializeCallbacks(Module &M) {    // Declare our poisoning and unpoisoning functions.    AsanPoisonGlobals = checkSanitizerInterfaceFunction(M.getOrInsertFunction( -      kAsanPoisonGlobalsName, IRB.getVoidTy(), IntptrTy, nullptr)); +      kAsanPoisonGlobalsName, IRB.getVoidTy(), IntptrTy));    AsanPoisonGlobals->setLinkage(Function::ExternalLinkage);    AsanUnpoisonGlobals = checkSanitizerInterfaceFunction(M.getOrInsertFunction( -      kAsanUnpoisonGlobalsName, IRB.getVoidTy(), nullptr)); +      kAsanUnpoisonGlobalsName, IRB.getVoidTy()));    AsanUnpoisonGlobals->setLinkage(Function::ExternalLinkage);    // Declare functions that register/unregister globals.    AsanRegisterGlobals = checkSanitizerInterfaceFunction(M.getOrInsertFunction( -      kAsanRegisterGlobalsName, IRB.getVoidTy(), IntptrTy, IntptrTy, nullptr)); +      kAsanRegisterGlobalsName, IRB.getVoidTy(), IntptrTy, IntptrTy));    AsanRegisterGlobals->setLinkage(Function::ExternalLinkage);    AsanUnregisterGlobals = checkSanitizerInterfaceFunction(        M.getOrInsertFunction(kAsanUnregisterGlobalsName, IRB.getVoidTy(), -                            IntptrTy, IntptrTy, nullptr)); +                            IntptrTy, IntptrTy));    AsanUnregisterGlobals->setLinkage(Function::ExternalLinkage);    // Declare the functions that find globals in a shared object and then invoke    // the (un)register function on them.    AsanRegisterImageGlobals =        checkSanitizerInterfaceFunction(M.getOrInsertFunction( -          kAsanRegisterImageGlobalsName, IRB.getVoidTy(), IntptrTy, nullptr)); +          kAsanRegisterImageGlobalsName, IRB.getVoidTy(), IntptrTy));    AsanRegisterImageGlobals->setLinkage(Function::ExternalLinkage);    AsanUnregisterImageGlobals =        checkSanitizerInterfaceFunction(M.getOrInsertFunction( -          kAsanUnregisterImageGlobalsName, IRB.getVoidTy(), IntptrTy, nullptr)); +          kAsanUnregisterImageGlobalsName, IRB.getVoidTy(), IntptrTy));    AsanUnregisterImageGlobals->setLinkage(Function::ExternalLinkage);  } @@ -1618,11 +1625,12 @@ void AddressSanitizerModule::SetComdatForGlobalMetadata(  GlobalVariable *  AddressSanitizerModule::CreateMetadataGlobal(Module &M, Constant *Initializer,                                               StringRef OriginalName) { -  GlobalVariable *Metadata = -      new GlobalVariable(M, Initializer->getType(), false, -                         GlobalVariable::InternalLinkage, Initializer, -                         Twine("__asan_global_") + -                             GlobalValue::getRealLinkageName(OriginalName)); +  auto Linkage = TargetTriple.isOSBinFormatMachO() +                     ? GlobalVariable::InternalLinkage +                     : GlobalVariable::PrivateLinkage; +  GlobalVariable *Metadata = new GlobalVariable( +      M, Initializer->getType(), false, Linkage, Initializer, +      Twine("__asan_global_") + GlobalValue::getRealLinkageName(OriginalName));    Metadata->setSection(getGlobalMetadataSection());    return Metadata;  } @@ -1862,7 +1870,8 @@ bool AddressSanitizerModule::InstrumentGlobals(IRBuilder<> &IRB, Module &M) {      GlobalValue *InstrumentedGlobal = NewGlobal;      bool CanUsePrivateAliases = -        TargetTriple.isOSBinFormatELF() || TargetTriple.isOSBinFormatMachO(); +        TargetTriple.isOSBinFormatELF() || TargetTriple.isOSBinFormatMachO() || +        TargetTriple.isOSBinFormatWasm();      if (CanUsePrivateAliases && ClUsePrivateAliasForGlobals) {        // Create local alias for NewGlobal to avoid crash on ODR between        // instrumented and non-instrumented libraries. @@ -1926,13 +1935,19 @@ bool AddressSanitizerModule::runOnModule(Module &M) {    Mapping = getShadowMapping(TargetTriple, LongSize, CompileKernel);    initializeCallbacks(M); -  bool Changed = false; +  if (CompileKernel) +    return false; + +  Function *AsanCtorFunction; +  std::tie(AsanCtorFunction, std::ignore) = createSanitizerCtorAndInitFunctions( +      M, kAsanModuleCtorName, kAsanInitName, /*InitArgTypes=*/{}, +      /*InitArgs=*/{}, kAsanVersionCheckName); +  appendToGlobalCtors(M, AsanCtorFunction, kAsanCtorAndDtorPriority); +  bool Changed = false;    // TODO(glider): temporarily disabled globals instrumentation for KASan. -  if (ClGlobals && !CompileKernel) { -    Function *CtorFunc = M.getFunction(kAsanModuleCtorName); -    assert(CtorFunc); -    IRBuilder<> IRB(CtorFunc->getEntryBlock().getTerminator()); +  if (ClGlobals) { +    IRBuilder<> IRB(AsanCtorFunction->getEntryBlock().getTerminator());      Changed |= InstrumentGlobals(IRB, M);    } @@ -1949,49 +1964,60 @@ void AddressSanitizer::initializeCallbacks(Module &M) {        const std::string ExpStr = Exp ? "exp_" : "";        const std::string SuffixStr = CompileKernel ? "N" : "_n";        const std::string EndingStr = Recover ? "_noabort" : ""; -      Type *ExpType = Exp ? Type::getInt32Ty(*C) : nullptr; -      AsanErrorCallbackSized[AccessIsWrite][Exp] = -          checkSanitizerInterfaceFunction(M.getOrInsertFunction( -              kAsanReportErrorTemplate + ExpStr + TypeStr + SuffixStr + EndingStr, -              IRB.getVoidTy(), IntptrTy, IntptrTy, ExpType, nullptr)); -      AsanMemoryAccessCallbackSized[AccessIsWrite][Exp] = -          checkSanitizerInterfaceFunction(M.getOrInsertFunction( -              ClMemoryAccessCallbackPrefix + ExpStr + TypeStr + "N" + EndingStr, -              IRB.getVoidTy(), IntptrTy, IntptrTy, ExpType, nullptr)); -      for (size_t AccessSizeIndex = 0; AccessSizeIndex < kNumberOfAccessSizes; -           AccessSizeIndex++) { -        const std::string Suffix = TypeStr + itostr(1ULL << AccessSizeIndex); -        AsanErrorCallback[AccessIsWrite][Exp][AccessSizeIndex] = -            checkSanitizerInterfaceFunction(M.getOrInsertFunction( -                kAsanReportErrorTemplate + ExpStr + Suffix + EndingStr, -                IRB.getVoidTy(), IntptrTy, ExpType, nullptr)); -        AsanMemoryAccessCallback[AccessIsWrite][Exp][AccessSizeIndex] = -            checkSanitizerInterfaceFunction(M.getOrInsertFunction( -                ClMemoryAccessCallbackPrefix + ExpStr + Suffix + EndingStr, -                IRB.getVoidTy(), IntptrTy, ExpType, nullptr)); + +      SmallVector<Type *, 3> Args2 = {IntptrTy, IntptrTy}; +      SmallVector<Type *, 2> Args1{1, IntptrTy}; +      if (Exp) { +        Type *ExpType = Type::getInt32Ty(*C); +        Args2.push_back(ExpType); +        Args1.push_back(ExpType);        } -    } +	    AsanErrorCallbackSized[AccessIsWrite][Exp] = +	        checkSanitizerInterfaceFunction(M.getOrInsertFunction( +	            kAsanReportErrorTemplate + ExpStr + TypeStr + SuffixStr + +	                EndingStr, +	            FunctionType::get(IRB.getVoidTy(), Args2, false))); + +	    AsanMemoryAccessCallbackSized[AccessIsWrite][Exp] = +	        checkSanitizerInterfaceFunction(M.getOrInsertFunction( +	            ClMemoryAccessCallbackPrefix + ExpStr + TypeStr + "N" + EndingStr, +	            FunctionType::get(IRB.getVoidTy(), Args2, false))); + +	    for (size_t AccessSizeIndex = 0; AccessSizeIndex < kNumberOfAccessSizes; +	         AccessSizeIndex++) { +	      const std::string Suffix = TypeStr + itostr(1ULL << AccessSizeIndex); +	      AsanErrorCallback[AccessIsWrite][Exp][AccessSizeIndex] = +	          checkSanitizerInterfaceFunction(M.getOrInsertFunction( +	              kAsanReportErrorTemplate + ExpStr + Suffix + EndingStr, +	              FunctionType::get(IRB.getVoidTy(), Args1, false))); + +	      AsanMemoryAccessCallback[AccessIsWrite][Exp][AccessSizeIndex] = +	          checkSanitizerInterfaceFunction(M.getOrInsertFunction( +	              ClMemoryAccessCallbackPrefix + ExpStr + Suffix + EndingStr, +	              FunctionType::get(IRB.getVoidTy(), Args1, false))); +	    } +	  }    }    const std::string MemIntrinCallbackPrefix =        CompileKernel ? std::string("") : ClMemoryAccessCallbackPrefix;    AsanMemmove = checkSanitizerInterfaceFunction(M.getOrInsertFunction(        MemIntrinCallbackPrefix + "memmove", IRB.getInt8PtrTy(), -      IRB.getInt8PtrTy(), IRB.getInt8PtrTy(), IntptrTy, nullptr)); +      IRB.getInt8PtrTy(), IRB.getInt8PtrTy(), IntptrTy));    AsanMemcpy = checkSanitizerInterfaceFunction(M.getOrInsertFunction(        MemIntrinCallbackPrefix + "memcpy", IRB.getInt8PtrTy(), -      IRB.getInt8PtrTy(), IRB.getInt8PtrTy(), IntptrTy, nullptr)); +      IRB.getInt8PtrTy(), IRB.getInt8PtrTy(), IntptrTy));    AsanMemset = checkSanitizerInterfaceFunction(M.getOrInsertFunction(        MemIntrinCallbackPrefix + "memset", IRB.getInt8PtrTy(), -      IRB.getInt8PtrTy(), IRB.getInt32Ty(), IntptrTy, nullptr)); +      IRB.getInt8PtrTy(), IRB.getInt32Ty(), IntptrTy));    AsanHandleNoReturnFunc = checkSanitizerInterfaceFunction( -      M.getOrInsertFunction(kAsanHandleNoReturnName, IRB.getVoidTy(), nullptr)); +      M.getOrInsertFunction(kAsanHandleNoReturnName, IRB.getVoidTy()));    AsanPtrCmpFunction = checkSanitizerInterfaceFunction(M.getOrInsertFunction( -      kAsanPtrCmp, IRB.getVoidTy(), IntptrTy, IntptrTy, nullptr)); +      kAsanPtrCmp, IRB.getVoidTy(), IntptrTy, IntptrTy));    AsanPtrSubFunction = checkSanitizerInterfaceFunction(M.getOrInsertFunction( -      kAsanPtrSub, IRB.getVoidTy(), IntptrTy, IntptrTy, nullptr)); +      kAsanPtrSub, IRB.getVoidTy(), IntptrTy, IntptrTy));    // We insert an empty inline asm after __asan_report* to avoid callback merge.    EmptyAsm = InlineAsm::get(FunctionType::get(IRB.getVoidTy(), false),                              StringRef(""), StringRef(""), @@ -2001,7 +2027,6 @@ void AddressSanitizer::initializeCallbacks(Module &M) {  // virtual  bool AddressSanitizer::doInitialization(Module &M) {    // Initialize the private fields. No one has accessed them before. -    GlobalsMD.init(M);    C = &(M.getContext()); @@ -2009,13 +2034,6 @@ bool AddressSanitizer::doInitialization(Module &M) {    IntptrTy = Type::getIntNTy(*C, LongSize);    TargetTriple = Triple(M.getTargetTriple()); -  if (!CompileKernel) { -    std::tie(AsanCtorFunction, AsanInitFunction) = -        createSanitizerCtorAndInitFunctions( -            M, kAsanModuleCtorName, kAsanInitName, -            /*InitArgTypes=*/{}, /*InitArgs=*/{}, kAsanVersionCheckName); -    appendToGlobalCtors(M, AsanCtorFunction, kAsanCtorAndDtorPriority); -  }    Mapping = getShadowMapping(TargetTriple, LongSize, CompileKernel);    return true;  } @@ -2034,6 +2052,8 @@ bool AddressSanitizer::maybeInsertAsanInitAtFunctionEntry(Function &F) {    // We cannot just ignore these methods, because they may call other    // instrumented functions.    if (F.getName().find(" load]") != std::string::npos) { +    Function *AsanInitFunction = +        declareSanitizerInitFunction(*F.getParent(), kAsanInitName, {});      IRBuilder<> IRB(&F.front(), F.front().begin());      IRB.CreateCall(AsanInitFunction, {});      return true; @@ -2081,7 +2101,6 @@ void AddressSanitizer::markEscapedLocalAllocas(Function &F) {  }  bool AddressSanitizer::runOnFunction(Function &F) { -  if (&F == AsanCtorFunction) return false;    if (F.getLinkage() == GlobalValue::AvailableExternallyLinkage) return false;    if (!ClDebugFunc.empty() && ClDebugFunc == F.getName()) return false;    if (F.getName().startswith("__asan_")) return false; @@ -2175,8 +2194,9 @@ bool AddressSanitizer::runOnFunction(Function &F) {        (ClInstrumentationWithCallsThreshold >= 0 &&         ToInstrument.size() > (unsigned)ClInstrumentationWithCallsThreshold);    const DataLayout &DL = F.getParent()->getDataLayout(); -  ObjectSizeOffsetVisitor ObjSizeVis(DL, TLI, F.getContext(), -                                     /*RoundToAlign=*/true); +  ObjectSizeOpts ObjSizeOpts; +  ObjSizeOpts.RoundToAlign = true; +  ObjectSizeOffsetVisitor ObjSizeVis(DL, TLI, F.getContext(), ObjSizeOpts);    // Instrument.    int NumInstrumented = 0; @@ -2234,18 +2254,18 @@ void FunctionStackPoisoner::initializeCallbacks(Module &M) {      std::string Suffix = itostr(i);      AsanStackMallocFunc[i] = checkSanitizerInterfaceFunction(          M.getOrInsertFunction(kAsanStackMallocNameTemplate + Suffix, IntptrTy, -                              IntptrTy, nullptr)); +                              IntptrTy));      AsanStackFreeFunc[i] = checkSanitizerInterfaceFunction(          M.getOrInsertFunction(kAsanStackFreeNameTemplate + Suffix, -                              IRB.getVoidTy(), IntptrTy, IntptrTy, nullptr)); +                              IRB.getVoidTy(), IntptrTy, IntptrTy));    }    if (ASan.UseAfterScope) {      AsanPoisonStackMemoryFunc = checkSanitizerInterfaceFunction(          M.getOrInsertFunction(kAsanPoisonStackMemoryName, IRB.getVoidTy(), -                              IntptrTy, IntptrTy, nullptr)); +                              IntptrTy, IntptrTy));      AsanUnpoisonStackMemoryFunc = checkSanitizerInterfaceFunction(          M.getOrInsertFunction(kAsanUnpoisonStackMemoryName, IRB.getVoidTy(), -                              IntptrTy, IntptrTy, nullptr)); +                              IntptrTy, IntptrTy));    }    for (size_t Val : {0x00, 0xf1, 0xf2, 0xf3, 0xf5, 0xf8}) { @@ -2254,14 +2274,14 @@ void FunctionStackPoisoner::initializeCallbacks(Module &M) {      Name << std::setw(2) << std::setfill('0') << std::hex << Val;      AsanSetShadowFunc[Val] =          checkSanitizerInterfaceFunction(M.getOrInsertFunction( -            Name.str(), IRB.getVoidTy(), IntptrTy, IntptrTy, nullptr)); +            Name.str(), IRB.getVoidTy(), IntptrTy, IntptrTy));    }    AsanAllocaPoisonFunc = checkSanitizerInterfaceFunction(M.getOrInsertFunction( -      kAsanAllocaPoison, IRB.getVoidTy(), IntptrTy, IntptrTy, nullptr)); +      kAsanAllocaPoison, IRB.getVoidTy(), IntptrTy, IntptrTy));    AsanAllocasUnpoisonFunc =        checkSanitizerInterfaceFunction(M.getOrInsertFunction( -          kAsanAllocasUnpoison, IRB.getVoidTy(), IntptrTy, IntptrTy, nullptr)); +          kAsanAllocasUnpoison, IRB.getVoidTy(), IntptrTy, IntptrTy));  }  void FunctionStackPoisoner::copyToShadowInline(ArrayRef<uint8_t> ShadowMask, diff --git a/lib/Transforms/Instrumentation/DataFlowSanitizer.cpp b/lib/Transforms/Instrumentation/DataFlowSanitizer.cpp index b34d5b8c45a7..4e454f0c95b6 100644 --- a/lib/Transforms/Instrumentation/DataFlowSanitizer.cpp +++ b/lib/Transforms/Instrumentation/DataFlowSanitizer.cpp @@ -254,7 +254,7 @@ class DataFlowSanitizer : public ModulePass {    MDNode *ColdCallWeights;    DFSanABIList ABIList;    DenseMap<Value *, Function *> UnwrappedFnMap; -  AttributeSet ReadOnlyNoneAttrs; +  AttributeList ReadOnlyNoneAttrs;    bool DFSanRuntimeShadowMask;    Value *getShadowAddress(Value *Addr, Instruction *Pos); @@ -331,6 +331,10 @@ class DFSanVisitor : public InstVisitor<DFSanVisitor> {    DFSanFunction &DFSF;    DFSanVisitor(DFSanFunction &DFSF) : DFSF(DFSF) {} +  const DataLayout &getDataLayout() const { +    return DFSF.F->getParent()->getDataLayout(); +  } +    void visitOperandShadowInst(Instruction &I);    void visitBinaryOperator(BinaryOperator &BO); @@ -539,16 +543,17 @@ DataFlowSanitizer::buildWrapperFunction(Function *F, StringRef NewFName,                                      F->getParent());    NewF->copyAttributesFrom(F);    NewF->removeAttributes( -    AttributeSet::ReturnIndex, -    AttributeSet::get(F->getContext(), AttributeSet::ReturnIndex, -                    AttributeFuncs::typeIncompatible(NewFT->getReturnType()))); +      AttributeList::ReturnIndex, +      AttributeList::get( +          F->getContext(), AttributeList::ReturnIndex, +          AttributeFuncs::typeIncompatible(NewFT->getReturnType())));    BasicBlock *BB = BasicBlock::Create(*Ctx, "entry", NewF);    if (F->isVarArg()) {      NewF->removeAttributes( -        AttributeSet::FunctionIndex, -        AttributeSet().addAttribute(*Ctx, AttributeSet::FunctionIndex, -                                    "split-stack")); +        AttributeList::FunctionIndex, +        AttributeList().addAttribute(*Ctx, AttributeList::FunctionIndex, +                                     "split-stack"));      CallInst::Create(DFSanVarargWrapperFn,                       IRBuilder<>(BB).CreateGlobalStringPtr(F->getName()), "",                       BB); @@ -580,8 +585,7 @@ Constant *DataFlowSanitizer::getOrBuildTrampolineFunction(FunctionType *FT,      Function::arg_iterator AI = F->arg_begin(); ++AI;      for (unsigned N = FT->getNumParams(); N != 0; ++AI, --N)        Args.push_back(&*AI); -    CallInst *CI = -        CallInst::Create(&F->getArgumentList().front(), Args, "", BB); +    CallInst *CI = CallInst::Create(&*F->arg_begin(), Args, "", BB);      ReturnInst *RI;      if (FT->getReturnType()->isVoidTy())        RI = ReturnInst::Create(*Ctx, BB); @@ -595,7 +599,7 @@ Constant *DataFlowSanitizer::getOrBuildTrampolineFunction(FunctionType *FT,      DFSanVisitor(DFSF).visitCallInst(*CI);      if (!FT->getReturnType()->isVoidTy())        new StoreInst(DFSF.getShadow(RI->getReturnValue()), -                    &F->getArgumentList().back(), RI); +                    &*std::prev(F->arg_end()), RI);    }    return C; @@ -622,26 +626,26 @@ bool DataFlowSanitizer::runOnModule(Module &M) {    DFSanUnionFn = Mod->getOrInsertFunction("__dfsan_union", DFSanUnionFnTy);    if (Function *F = dyn_cast<Function>(DFSanUnionFn)) { -    F->addAttribute(AttributeSet::FunctionIndex, Attribute::NoUnwind); -    F->addAttribute(AttributeSet::FunctionIndex, Attribute::ReadNone); -    F->addAttribute(AttributeSet::ReturnIndex, Attribute::ZExt); +    F->addAttribute(AttributeList::FunctionIndex, Attribute::NoUnwind); +    F->addAttribute(AttributeList::FunctionIndex, Attribute::ReadNone); +    F->addAttribute(AttributeList::ReturnIndex, Attribute::ZExt);      F->addAttribute(1, Attribute::ZExt);      F->addAttribute(2, Attribute::ZExt);    }    DFSanCheckedUnionFn = Mod->getOrInsertFunction("dfsan_union", DFSanUnionFnTy);    if (Function *F = dyn_cast<Function>(DFSanCheckedUnionFn)) { -    F->addAttribute(AttributeSet::FunctionIndex, Attribute::NoUnwind); -    F->addAttribute(AttributeSet::FunctionIndex, Attribute::ReadNone); -    F->addAttribute(AttributeSet::ReturnIndex, Attribute::ZExt); +    F->addAttribute(AttributeList::FunctionIndex, Attribute::NoUnwind); +    F->addAttribute(AttributeList::FunctionIndex, Attribute::ReadNone); +    F->addAttribute(AttributeList::ReturnIndex, Attribute::ZExt);      F->addAttribute(1, Attribute::ZExt);      F->addAttribute(2, Attribute::ZExt);    }    DFSanUnionLoadFn =        Mod->getOrInsertFunction("__dfsan_union_load", DFSanUnionLoadFnTy);    if (Function *F = dyn_cast<Function>(DFSanUnionLoadFn)) { -    F->addAttribute(AttributeSet::FunctionIndex, Attribute::NoUnwind); -    F->addAttribute(AttributeSet::FunctionIndex, Attribute::ReadOnly); -    F->addAttribute(AttributeSet::ReturnIndex, Attribute::ZExt); +    F->addAttribute(AttributeList::FunctionIndex, Attribute::NoUnwind); +    F->addAttribute(AttributeList::FunctionIndex, Attribute::ReadOnly); +    F->addAttribute(AttributeList::ReturnIndex, Attribute::ZExt);    }    DFSanUnimplementedFn =        Mod->getOrInsertFunction("__dfsan_unimplemented", DFSanUnimplementedFnTy); @@ -696,7 +700,7 @@ bool DataFlowSanitizer::runOnModule(Module &M) {    AttrBuilder B;    B.addAttribute(Attribute::ReadOnly).addAttribute(Attribute::ReadNone); -  ReadOnlyNoneAttrs = AttributeSet::get(*Ctx, AttributeSet::FunctionIndex, B); +  ReadOnlyNoneAttrs = AttributeList::get(*Ctx, AttributeList::FunctionIndex, B);    // First, change the ABI of every function in the module.  ABI-listed    // functions keep their original ABI and get a wrapper function. @@ -717,9 +721,10 @@ bool DataFlowSanitizer::runOnModule(Module &M) {          Function *NewF = Function::Create(NewFT, F.getLinkage(), "", &M);          NewF->copyAttributesFrom(&F);          NewF->removeAttributes( -          AttributeSet::ReturnIndex, -          AttributeSet::get(NewF->getContext(), AttributeSet::ReturnIndex, -                    AttributeFuncs::typeIncompatible(NewFT->getReturnType()))); +            AttributeList::ReturnIndex, +            AttributeList::get( +                NewF->getContext(), AttributeList::ReturnIndex, +                AttributeFuncs::typeIncompatible(NewFT->getReturnType())));          for (Function::arg_iterator FArg = F.arg_begin(),                                      NewFArg = NewF->arg_begin(),                                      FArgEnd = F.arg_end(); @@ -758,7 +763,7 @@ bool DataFlowSanitizer::runOnModule(Module &M) {            &F, std::string("dfsw$") + std::string(F.getName()),            GlobalValue::LinkOnceODRLinkage, NewFT);        if (getInstrumentedABI() == IA_TLS) -        NewF->removeAttributes(AttributeSet::FunctionIndex, ReadOnlyNoneAttrs); +        NewF->removeAttributes(AttributeList::FunctionIndex, ReadOnlyNoneAttrs);        Value *WrappedFnCst =            ConstantExpr::getBitCast(NewF, PointerType::getUnqual(FT)); @@ -906,7 +911,7 @@ Value *DFSanFunction::getShadow(Value *V) {          break;        }        case DataFlowSanitizer::IA_Args: { -        unsigned ArgIdx = A->getArgNo() + F->getArgumentList().size() / 2; +        unsigned ArgIdx = A->getArgNo() + F->arg_size() / 2;          Function::arg_iterator i = F->arg_begin();          while (ArgIdx--)            ++i; @@ -983,7 +988,7 @@ Value *DFSanFunction::combineShadows(Value *V1, Value *V2, Instruction *Pos) {    IRBuilder<> IRB(Pos);    if (AvoidNewBlocks) {      CallInst *Call = IRB.CreateCall(DFS.DFSanCheckedUnionFn, {V1, V2}); -    Call->addAttribute(AttributeSet::ReturnIndex, Attribute::ZExt); +    Call->addAttribute(AttributeList::ReturnIndex, Attribute::ZExt);      Call->addAttribute(1, Attribute::ZExt);      Call->addAttribute(2, Attribute::ZExt); @@ -996,7 +1001,7 @@ Value *DFSanFunction::combineShadows(Value *V1, Value *V2, Instruction *Pos) {          Ne, Pos, /*Unreachable=*/false, DFS.ColdCallWeights, &DT));      IRBuilder<> ThenIRB(BI);      CallInst *Call = ThenIRB.CreateCall(DFS.DFSanUnionFn, {V1, V2}); -    Call->addAttribute(AttributeSet::ReturnIndex, Attribute::ZExt); +    Call->addAttribute(AttributeList::ReturnIndex, Attribute::ZExt);      Call->addAttribute(1, Attribute::ZExt);      Call->addAttribute(2, Attribute::ZExt); @@ -1099,7 +1104,7 @@ Value *DFSanFunction::loadShadow(Value *Addr, uint64_t Size, uint64_t Align,      CallInst *FallbackCall = FallbackIRB.CreateCall(          DFS.DFSanUnionLoadFn,          {ShadowAddr, ConstantInt::get(DFS.IntptrTy, Size)}); -    FallbackCall->addAttribute(AttributeSet::ReturnIndex, Attribute::ZExt); +    FallbackCall->addAttribute(AttributeList::ReturnIndex, Attribute::ZExt);      // Compare each of the shadows stored in the loaded 64 bits to each other,      // by computing (WideShadow rotl ShadowWidth) == WideShadow. @@ -1156,7 +1161,7 @@ Value *DFSanFunction::loadShadow(Value *Addr, uint64_t Size, uint64_t Align,    IRBuilder<> IRB(Pos);    CallInst *FallbackCall = IRB.CreateCall(        DFS.DFSanUnionLoadFn, {ShadowAddr, ConstantInt::get(DFS.IntptrTy, Size)}); -  FallbackCall->addAttribute(AttributeSet::ReturnIndex, Attribute::ZExt); +  FallbackCall->addAttribute(AttributeList::ReturnIndex, Attribute::ZExt);    return FallbackCall;  } @@ -1446,7 +1451,7 @@ void DFSanVisitor::visitCallSite(CallSite CS) {            // Custom functions returning non-void will write to the return label.            if (!FT->getReturnType()->isVoidTy()) { -            CustomFn->removeAttributes(AttributeSet::FunctionIndex, +            CustomFn->removeAttributes(AttributeList::FunctionIndex,                                         DFSF.DFS.ReadOnlyNoneAttrs);            }          } @@ -1481,7 +1486,8 @@ void DFSanVisitor::visitCallSite(CallSite CS) {            auto *LabelVATy = ArrayType::get(DFSF.DFS.ShadowTy,                                             CS.arg_size() - FT->getNumParams());            auto *LabelVAAlloca = new AllocaInst( -              LabelVATy, "labelva", &DFSF.F->getEntryBlock().front()); +              LabelVATy, getDataLayout().getAllocaAddrSpace(), +              "labelva", &DFSF.F->getEntryBlock().front());            for (unsigned n = 0; i != CS.arg_end(); ++i, ++n) {              auto LabelVAPtr = IRB.CreateStructGEP(LabelVATy, LabelVAAlloca, n); @@ -1494,8 +1500,9 @@ void DFSanVisitor::visitCallSite(CallSite CS) {          if (!FT->getReturnType()->isVoidTy()) {            if (!DFSF.LabelReturnAlloca) {              DFSF.LabelReturnAlloca = -                new AllocaInst(DFSF.DFS.ShadowTy, "labelreturn", -                               &DFSF.F->getEntryBlock().front()); +              new AllocaInst(DFSF.DFS.ShadowTy, +                             getDataLayout().getAllocaAddrSpace(), +                             "labelreturn", &DFSF.F->getEntryBlock().front());            }            Args.push_back(DFSF.LabelReturnAlloca);          } @@ -1574,7 +1581,8 @@ void DFSanVisitor::visitCallSite(CallSite CS) {        unsigned VarArgSize = CS.arg_size() - FT->getNumParams();        ArrayType *VarArgArrayTy = ArrayType::get(DFSF.DFS.ShadowTy, VarArgSize);        AllocaInst *VarArgShadow = -          new AllocaInst(VarArgArrayTy, "", &DFSF.F->getEntryBlock().front()); +        new AllocaInst(VarArgArrayTy, getDataLayout().getAllocaAddrSpace(), +                       "", &DFSF.F->getEntryBlock().front());        Args.push_back(IRB.CreateConstGEP2_32(VarArgArrayTy, VarArgShadow, 0, 0));        for (unsigned n = 0; i != e; ++i, ++n) {          IRB.CreateStore( @@ -1593,7 +1601,7 @@ void DFSanVisitor::visitCallSite(CallSite CS) {      }      NewCS.setCallingConv(CS.getCallingConv());      NewCS.setAttributes(CS.getAttributes().removeAttributes( -        *DFSF.DFS.Ctx, AttributeSet::ReturnIndex, +        *DFSF.DFS.Ctx, AttributeList::ReturnIndex,          AttributeFuncs::typeIncompatible(NewCS.getInstruction()->getType())));      if (Next) { diff --git a/lib/Transforms/Instrumentation/EfficiencySanitizer.cpp b/lib/Transforms/Instrumentation/EfficiencySanitizer.cpp index 05eba6c4dc69..7dea1dee756a 100644 --- a/lib/Transforms/Instrumentation/EfficiencySanitizer.cpp +++ b/lib/Transforms/Instrumentation/EfficiencySanitizer.cpp @@ -267,35 +267,35 @@ void EfficiencySanitizer::initializeCallbacks(Module &M) {      SmallString<32> AlignedLoadName("__esan_aligned_load" + ByteSizeStr);      EsanAlignedLoad[Idx] =          checkSanitizerInterfaceFunction(M.getOrInsertFunction( -            AlignedLoadName, IRB.getVoidTy(), IRB.getInt8PtrTy(), nullptr)); +            AlignedLoadName, IRB.getVoidTy(), IRB.getInt8PtrTy()));      SmallString<32> AlignedStoreName("__esan_aligned_store" + ByteSizeStr);      EsanAlignedStore[Idx] =          checkSanitizerInterfaceFunction(M.getOrInsertFunction( -            AlignedStoreName, IRB.getVoidTy(), IRB.getInt8PtrTy(), nullptr)); +            AlignedStoreName, IRB.getVoidTy(), IRB.getInt8PtrTy()));      SmallString<32> UnalignedLoadName("__esan_unaligned_load" + ByteSizeStr);      EsanUnalignedLoad[Idx] =          checkSanitizerInterfaceFunction(M.getOrInsertFunction( -            UnalignedLoadName, IRB.getVoidTy(), IRB.getInt8PtrTy(), nullptr)); +            UnalignedLoadName, IRB.getVoidTy(), IRB.getInt8PtrTy()));      SmallString<32> UnalignedStoreName("__esan_unaligned_store" + ByteSizeStr);      EsanUnalignedStore[Idx] =          checkSanitizerInterfaceFunction(M.getOrInsertFunction( -            UnalignedStoreName, IRB.getVoidTy(), IRB.getInt8PtrTy(), nullptr)); +            UnalignedStoreName, IRB.getVoidTy(), IRB.getInt8PtrTy()));    }    EsanUnalignedLoadN = checkSanitizerInterfaceFunction(        M.getOrInsertFunction("__esan_unaligned_loadN", IRB.getVoidTy(), -                            IRB.getInt8PtrTy(), IntptrTy, nullptr)); +                            IRB.getInt8PtrTy(), IntptrTy));    EsanUnalignedStoreN = checkSanitizerInterfaceFunction(        M.getOrInsertFunction("__esan_unaligned_storeN", IRB.getVoidTy(), -                            IRB.getInt8PtrTy(), IntptrTy, nullptr)); +                            IRB.getInt8PtrTy(), IntptrTy));    MemmoveFn = checkSanitizerInterfaceFunction(        M.getOrInsertFunction("memmove", IRB.getInt8PtrTy(), IRB.getInt8PtrTy(), -                            IRB.getInt8PtrTy(), IntptrTy, nullptr)); +                            IRB.getInt8PtrTy(), IntptrTy));    MemcpyFn = checkSanitizerInterfaceFunction(        M.getOrInsertFunction("memcpy", IRB.getInt8PtrTy(), IRB.getInt8PtrTy(), -                            IRB.getInt8PtrTy(), IntptrTy, nullptr)); +                            IRB.getInt8PtrTy(), IntptrTy));    MemsetFn = checkSanitizerInterfaceFunction(        M.getOrInsertFunction("memset", IRB.getInt8PtrTy(), IRB.getInt8PtrTy(), -                            IRB.getInt32Ty(), IntptrTy, nullptr)); +                            IRB.getInt32Ty(), IntptrTy));  }  bool EfficiencySanitizer::shouldIgnoreStructType(StructType *StructTy) { @@ -533,7 +533,7 @@ void EfficiencySanitizer::createDestructor(Module &M, Constant *ToolInfoArg) {    IRBuilder<> IRB_Dtor(EsanDtorFunction->getEntryBlock().getTerminator());    Function *EsanExit = checkSanitizerInterfaceFunction(        M.getOrInsertFunction(EsanExitName, IRB_Dtor.getVoidTy(), -                            Int8PtrTy, nullptr)); +                            Int8PtrTy));    EsanExit->setLinkage(Function::ExternalLinkage);    IRB_Dtor.CreateCall(EsanExit, {ToolInfoArg});    appendToGlobalDtors(M, EsanDtorFunction, EsanCtorAndDtorPriority); @@ -757,7 +757,7 @@ bool EfficiencySanitizer::instrumentGetElementPtr(Instruction *I, Module &M) {      return false;    }    Type *SourceTy = GepInst->getSourceElementType(); -  StructType *StructTy; +  StructType *StructTy = nullptr;    ConstantInt *Idx;    // Check if GEP calculates address from a struct array.    if (isa<StructType>(SourceTy)) { diff --git a/lib/Transforms/Instrumentation/IndirectCallPromotion.cpp b/lib/Transforms/Instrumentation/IndirectCallPromotion.cpp index 1ba13bdfe05a..61d627673c90 100644 --- a/lib/Transforms/Instrumentation/IndirectCallPromotion.cpp +++ b/lib/Transforms/Instrumentation/IndirectCallPromotion.cpp @@ -1,4 +1,4 @@ -//===-- IndirectCallPromotion.cpp - Promote indirect calls to direct calls ===// +//===-- IndirectCallPromotion.cpp - Optimizations based on value profiling ===//  //  //                      The LLVM Compiler Infrastructure  // @@ -17,6 +17,8 @@  #include "llvm/ADT/Statistic.h"  #include "llvm/ADT/StringRef.h"  #include "llvm/ADT/Twine.h" +#include "llvm/Analysis/BlockFrequencyInfo.h" +#include "llvm/Analysis/GlobalsModRef.h"  #include "llvm/Analysis/IndirectCallPromotionAnalysis.h"  #include "llvm/Analysis/IndirectCallSiteVisitor.h"  #include "llvm/IR/BasicBlock.h" @@ -40,6 +42,7 @@  #include "llvm/Support/CommandLine.h"  #include "llvm/Support/Debug.h"  #include "llvm/Support/ErrorHandling.h" +#include "llvm/Support/MathExtras.h"  #include "llvm/Transforms/Instrumentation.h"  #include "llvm/Transforms/PGOInstrumentation.h"  #include "llvm/Transforms/Utils/BasicBlockUtils.h" @@ -53,6 +56,8 @@ using namespace llvm;  STATISTIC(NumOfPGOICallPromotion, "Number of indirect call promotions.");  STATISTIC(NumOfPGOICallsites, "Number of indirect call candidate sites."); +STATISTIC(NumOfPGOMemOPOpt, "Number of memop intrinsics optimized."); +STATISTIC(NumOfPGOMemOPAnnotate, "Number of memop intrinsics annotated.");  // Command line option to disable indirect-call promotion with the default as  // false. This is for debug purpose. @@ -80,6 +85,12 @@ static cl::opt<bool> ICPLTOMode("icp-lto", cl::init(false), cl::Hidden,                                  cl::desc("Run indirect-call promotion in LTO "                                           "mode")); +// Set if the pass is called in SamplePGO mode. The difference for SamplePGO +// mode is it will add prof metadatato the created direct call. +static cl::opt<bool> +    ICPSamplePGOMode("icp-samplepgo", cl::init(false), cl::Hidden, +                     cl::desc("Run indirect-call promotion in SamplePGO mode")); +  // If the option is set to true, only call instructions will be considered for  // transformation -- invoke instructions will be ignored.  static cl::opt<bool> @@ -100,13 +111,51 @@ static cl::opt<bool>      ICPDUMPAFTER("icp-dumpafter", cl::init(false), cl::Hidden,                   cl::desc("Dump IR after transformation happens")); +// The minimum call count to optimize memory intrinsic calls. +static cl::opt<unsigned> +    MemOPCountThreshold("pgo-memop-count-threshold", cl::Hidden, cl::ZeroOrMore, +                        cl::init(1000), +                        cl::desc("The minimum count to optimize memory " +                                 "intrinsic calls")); + +// Command line option to disable memory intrinsic optimization. The default is +// false. This is for debug purpose. +static cl::opt<bool> DisableMemOPOPT("disable-memop-opt", cl::init(false), +                                     cl::Hidden, cl::desc("Disable optimize")); + +// The percent threshold to optimize memory intrinsic calls. +static cl::opt<unsigned> +    MemOPPercentThreshold("pgo-memop-percent-threshold", cl::init(40), +                          cl::Hidden, cl::ZeroOrMore, +                          cl::desc("The percentage threshold for the " +                                   "memory intrinsic calls optimization")); + +// Maximum number of versions for optimizing memory intrinsic call. +static cl::opt<unsigned> +    MemOPMaxVersion("pgo-memop-max-version", cl::init(3), cl::Hidden, +                    cl::ZeroOrMore, +                    cl::desc("The max version for the optimized memory " +                             " intrinsic calls")); + +// Scale the counts from the annotation using the BB count value. +static cl::opt<bool> +    MemOPScaleCount("pgo-memop-scale-count", cl::init(true), cl::Hidden, +                    cl::desc("Scale the memop size counts using the basic " +                             " block count value")); + +// This option sets the rangge of precise profile memop sizes. +extern cl::opt<std::string> MemOPSizeRange; + +// This option sets the value that groups large memop sizes +extern cl::opt<unsigned> MemOPSizeLarge; +  namespace {  class PGOIndirectCallPromotionLegacyPass : public ModulePass {  public:    static char ID; -  PGOIndirectCallPromotionLegacyPass(bool InLTO = false) -      : ModulePass(ID), InLTO(InLTO) { +  PGOIndirectCallPromotionLegacyPass(bool InLTO = false, bool SamplePGO = false) +      : ModulePass(ID), InLTO(InLTO), SamplePGO(SamplePGO) {      initializePGOIndirectCallPromotionLegacyPassPass(          *PassRegistry::getPassRegistry());    } @@ -119,6 +168,28 @@ private:    // If this pass is called in LTO. We need to special handling the PGOFuncName    // for the static variables due to LTO's internalization.    bool InLTO; + +  // If this pass is called in SamplePGO. We need to add the prof metadata to +  // the promoted direct call. +  bool SamplePGO; +}; + +class PGOMemOPSizeOptLegacyPass : public FunctionPass { +public: +  static char ID; + +  PGOMemOPSizeOptLegacyPass() : FunctionPass(ID) { +    initializePGOMemOPSizeOptLegacyPassPass(*PassRegistry::getPassRegistry()); +  } + +  StringRef getPassName() const override { return "PGOMemOPSize"; } + +private: +  bool runOnFunction(Function &F) override; +  void getAnalysisUsage(AnalysisUsage &AU) const override { +    AU.addRequired<BlockFrequencyInfoWrapperPass>(); +    AU.addPreserved<GlobalsAAWrapperPass>(); +  }  };  } // end anonymous namespace @@ -128,8 +199,22 @@ INITIALIZE_PASS(PGOIndirectCallPromotionLegacyPass, "pgo-icall-prom",                  "direct calls.",                  false, false) -ModulePass *llvm::createPGOIndirectCallPromotionLegacyPass(bool InLTO) { -  return new PGOIndirectCallPromotionLegacyPass(InLTO); +ModulePass *llvm::createPGOIndirectCallPromotionLegacyPass(bool InLTO, +                                                           bool SamplePGO) { +  return new PGOIndirectCallPromotionLegacyPass(InLTO, SamplePGO); +} + +char PGOMemOPSizeOptLegacyPass::ID = 0; +INITIALIZE_PASS_BEGIN(PGOMemOPSizeOptLegacyPass, "pgo-memop-opt", +                      "Optimize memory intrinsic using its size value profile", +                      false, false) +INITIALIZE_PASS_DEPENDENCY(BlockFrequencyInfoWrapperPass) +INITIALIZE_PASS_END(PGOMemOPSizeOptLegacyPass, "pgo-memop-opt", +                    "Optimize memory intrinsic using its size value profile", +                    false, false) + +FunctionPass *llvm::createPGOMemOPSizeOptLegacyPass() { +  return new PGOMemOPSizeOptLegacyPass();  }  namespace { @@ -144,17 +229,11 @@ private:    // defines.    InstrProfSymtab *Symtab; -  enum TargetStatus { -    OK,                   // Should be able to promote. -    NotAvailableInModule, // Cannot find the target in current module. -    ReturnTypeMismatch,   // Return type mismatch b/w target and indirect-call. -    NumArgsMismatch,      // Number of arguments does not match. -    ArgTypeMismatch       // Type mismatch in the arguments (cannot bitcast). -  }; +  bool SamplePGO;    // Test if we can legally promote this direct-call of Target. -  TargetStatus isPromotionLegal(Instruction *Inst, uint64_t Target, -                                Function *&F); +  bool isPromotionLegal(Instruction *Inst, uint64_t Target, Function *&F, +                        const char **Reason = nullptr);    // A struct that records the direct target and it's call count.    struct PromotionCandidate { @@ -172,91 +251,77 @@ private:        Instruction *Inst, const ArrayRef<InstrProfValueData> &ValueDataRef,        uint64_t TotalCount, uint32_t NumCandidates); -  // Main function that transforms Inst (either a indirect-call instruction, or -  // an invoke instruction , to a conditional call to F. This is like: -  //     if (Inst.CalledValue == F) -  //        F(...); -  //     else -  //        Inst(...); -  //     end -  // TotalCount is the profile count value that the instruction executes. -  // Count is the profile count value that F is the target function. -  // These two values are being used to update the branch weight. -  void promote(Instruction *Inst, Function *F, uint64_t Count, -               uint64_t TotalCount); -    // Promote a list of targets for one indirect-call callsite. Return    // the number of promotions.    uint32_t tryToPromote(Instruction *Inst,                          const std::vector<PromotionCandidate> &Candidates,                          uint64_t &TotalCount); -  static const char *StatusToString(const TargetStatus S) { -    switch (S) { -    case OK: -      return "OK to promote"; -    case NotAvailableInModule: -      return "Cannot find the target"; -    case ReturnTypeMismatch: -      return "Return type mismatch"; -    case NumArgsMismatch: -      return "The number of arguments mismatch"; -    case ArgTypeMismatch: -      return "Argument Type mismatch"; -    } -    llvm_unreachable("Should not reach here"); -  } -    // Noncopyable    ICallPromotionFunc(const ICallPromotionFunc &other) = delete;    ICallPromotionFunc &operator=(const ICallPromotionFunc &other) = delete;  public: -  ICallPromotionFunc(Function &Func, Module *Modu, InstrProfSymtab *Symtab) -      : F(Func), M(Modu), Symtab(Symtab) { -  } +  ICallPromotionFunc(Function &Func, Module *Modu, InstrProfSymtab *Symtab, +                     bool SamplePGO) +      : F(Func), M(Modu), Symtab(Symtab), SamplePGO(SamplePGO) {}    bool processFunction();  };  } // end anonymous namespace -ICallPromotionFunc::TargetStatus -ICallPromotionFunc::isPromotionLegal(Instruction *Inst, uint64_t Target, -                                     Function *&TargetFunction) { -  Function *DirectCallee = Symtab->getFunction(Target); -  if (DirectCallee == nullptr) -    return NotAvailableInModule; +bool llvm::isLegalToPromote(Instruction *Inst, Function *F, +                            const char **Reason) {    // Check the return type.    Type *CallRetType = Inst->getType();    if (!CallRetType->isVoidTy()) { -    Type *FuncRetType = DirectCallee->getReturnType(); +    Type *FuncRetType = F->getReturnType();      if (FuncRetType != CallRetType && -        !CastInst::isBitCastable(FuncRetType, CallRetType)) -      return ReturnTypeMismatch; +        !CastInst::isBitCastable(FuncRetType, CallRetType)) { +      if (Reason) +        *Reason = "Return type mismatch"; +      return false; +    }    }    // Check if the arguments are compatible with the parameters -  FunctionType *DirectCalleeType = DirectCallee->getFunctionType(); +  FunctionType *DirectCalleeType = F->getFunctionType();    unsigned ParamNum = DirectCalleeType->getFunctionNumParams();    CallSite CS(Inst);    unsigned ArgNum = CS.arg_size(); -  if (ParamNum != ArgNum && !DirectCalleeType->isVarArg()) -    return NumArgsMismatch; +  if (ParamNum != ArgNum && !DirectCalleeType->isVarArg()) { +    if (Reason) +      *Reason = "The number of arguments mismatch"; +    return false; +  }    for (unsigned I = 0; I < ParamNum; ++I) {      Type *PTy = DirectCalleeType->getFunctionParamType(I);      Type *ATy = CS.getArgument(I)->getType();      if (PTy == ATy)        continue; -    if (!CastInst::castIsValid(Instruction::BitCast, CS.getArgument(I), PTy)) -      return ArgTypeMismatch; +    if (!CastInst::castIsValid(Instruction::BitCast, CS.getArgument(I), PTy)) { +      if (Reason) +        *Reason = "Argument type mismatch"; +      return false; +    }    }    DEBUG(dbgs() << " #" << NumOfPGOICallPromotion << " Promote the icall to " -               << Symtab->getFuncName(Target) << "\n"); -  TargetFunction = DirectCallee; -  return OK; +               << F->getName() << "\n"); +  return true; +} + +bool ICallPromotionFunc::isPromotionLegal(Instruction *Inst, uint64_t Target, +                                          Function *&TargetFunction, +                                          const char **Reason) { +  TargetFunction = Symtab->getFunction(Target); +  if (TargetFunction == nullptr) { +    *Reason = "Cannot find the target"; +    return false; +  } +  return isLegalToPromote(Inst, TargetFunction, Reason);  }  // Indirect-call promotion heuristic. The direct targets are sorted based on @@ -296,10 +361,9 @@ ICallPromotionFunc::getPromotionCandidatesForCallSite(        break;      }      Function *TargetFunction = nullptr; -    TargetStatus Status = isPromotionLegal(Inst, Target, TargetFunction); -    if (Status != OK) { +    const char *Reason = nullptr; +    if (!isPromotionLegal(Inst, Target, TargetFunction, &Reason)) {        StringRef TargetFuncName = Symtab->getFuncName(Target); -      const char *Reason = StatusToString(Status);        DEBUG(dbgs() << " Not promote: " << Reason << "\n");        emitOptimizationRemarkMissed(            F.getContext(), "pgo-icall-prom", F, Inst->getDebugLoc(), @@ -532,8 +596,14 @@ static void insertCallRetPHI(Instruction *Inst, Instruction *CallResult,  //     Ret = phi(Ret1, Ret2);  // It adds type casts for the args do not match the parameters and the return  // value. Branch weights metadata also updated. -void ICallPromotionFunc::promote(Instruction *Inst, Function *DirectCallee, -                                 uint64_t Count, uint64_t TotalCount) { +// If \p AttachProfToDirectCall is true, a prof metadata is attached to the +// new direct call to contain \p Count. This is used by SamplePGO inliner to +// check callsite hotness. +// Returns the promoted direct call instruction. +Instruction *llvm::promoteIndirectCall(Instruction *Inst, +                                       Function *DirectCallee, uint64_t Count, +                                       uint64_t TotalCount, +                                       bool AttachProfToDirectCall) {    assert(DirectCallee != nullptr);    BasicBlock *BB = Inst->getParent();    // Just to suppress the non-debug build warning. @@ -548,6 +618,14 @@ void ICallPromotionFunc::promote(Instruction *Inst, Function *DirectCallee,    Instruction *NewInst =        createDirectCallInst(Inst, DirectCallee, DirectCallBB, MergeBB); +  if (AttachProfToDirectCall) { +    SmallVector<uint32_t, 1> Weights; +    Weights.push_back(Count); +    MDBuilder MDB(NewInst->getContext()); +    dyn_cast<Instruction>(NewInst->stripPointerCasts()) +        ->setMetadata(LLVMContext::MD_prof, MDB.createBranchWeights(Weights)); +  } +    // Move Inst from MergeBB to IndirectCallBB.    Inst->removeFromParent();    IndirectCallBB->getInstList().insert(IndirectCallBB->getFirstInsertionPt(), @@ -576,9 +654,10 @@ void ICallPromotionFunc::promote(Instruction *Inst, Function *DirectCallee,    DEBUG(dbgs() << *BB << *DirectCallBB << *IndirectCallBB << *MergeBB << "\n");    emitOptimizationRemark( -      F.getContext(), "pgo-icall-prom", F, Inst->getDebugLoc(), +      BB->getContext(), "pgo-icall-prom", *BB->getParent(), Inst->getDebugLoc(),        Twine("Promote indirect call to ") + DirectCallee->getName() +            " with count " + Twine(Count) + " out of " + Twine(TotalCount)); +  return NewInst;  }  // Promote indirect-call to conditional direct-call for one callsite. @@ -589,7 +668,7 @@ uint32_t ICallPromotionFunc::tryToPromote(    for (auto &C : Candidates) {      uint64_t Count = C.Count; -    promote(Inst, C.TargetFunction, Count, TotalCount); +    promoteIndirectCall(Inst, C.TargetFunction, Count, TotalCount, SamplePGO);      assert(TotalCount >= Count);      TotalCount -= Count;      NumOfPGOICallPromotion++; @@ -630,7 +709,7 @@ bool ICallPromotionFunc::processFunction() {  }  // A wrapper function that does the actual work. -static bool promoteIndirectCalls(Module &M, bool InLTO) { +static bool promoteIndirectCalls(Module &M, bool InLTO, bool SamplePGO) {    if (DisableICP)      return false;    InstrProfSymtab Symtab; @@ -641,7 +720,7 @@ static bool promoteIndirectCalls(Module &M, bool InLTO) {        continue;      if (F.hasFnAttribute(Attribute::OptimizeNone))        continue; -    ICallPromotionFunc ICallPromotion(F, &M, &Symtab); +    ICallPromotionFunc ICallPromotion(F, &M, &Symtab, SamplePGO);      bool FuncChanged = ICallPromotion.processFunction();      if (ICPDUMPAFTER && FuncChanged) {        DEBUG(dbgs() << "\n== IR Dump After =="; F.print(dbgs())); @@ -658,12 +737,289 @@ static bool promoteIndirectCalls(Module &M, bool InLTO) {  bool PGOIndirectCallPromotionLegacyPass::runOnModule(Module &M) {    // Command-line option has the priority for InLTO. -  return promoteIndirectCalls(M, InLTO | ICPLTOMode); +  return promoteIndirectCalls(M, InLTO | ICPLTOMode, +                              SamplePGO | ICPSamplePGOMode);  } -PreservedAnalyses PGOIndirectCallPromotion::run(Module &M, ModuleAnalysisManager &AM) { -  if (!promoteIndirectCalls(M, InLTO | ICPLTOMode)) +PreservedAnalyses PGOIndirectCallPromotion::run(Module &M, +                                                ModuleAnalysisManager &AM) { +  if (!promoteIndirectCalls(M, InLTO | ICPLTOMode, +                            SamplePGO | ICPSamplePGOMode))      return PreservedAnalyses::all();    return PreservedAnalyses::none();  } + +namespace { +class MemOPSizeOpt : public InstVisitor<MemOPSizeOpt> { +public: +  MemOPSizeOpt(Function &Func, BlockFrequencyInfo &BFI) +      : Func(Func), BFI(BFI), Changed(false) { +    ValueDataArray = +        llvm::make_unique<InstrProfValueData[]>(MemOPMaxVersion + 2); +    // Get the MemOPSize range information from option MemOPSizeRange, +    getMemOPSizeRangeFromOption(MemOPSizeRange, PreciseRangeStart, +                                PreciseRangeLast); +  } +  bool isChanged() const { return Changed; } +  void perform() { +    WorkList.clear(); +    visit(Func); + +    for (auto &MI : WorkList) { +      ++NumOfPGOMemOPAnnotate; +      if (perform(MI)) { +        Changed = true; +        ++NumOfPGOMemOPOpt; +        DEBUG(dbgs() << "MemOP calls: " << MI->getCalledFunction()->getName() +                     << "is Transformed.\n"); +      } +    } +  } + +  void visitMemIntrinsic(MemIntrinsic &MI) { +    Value *Length = MI.getLength(); +    // Not perform on constant length calls. +    if (dyn_cast<ConstantInt>(Length)) +      return; +    WorkList.push_back(&MI); +  } + +private: +  Function &Func; +  BlockFrequencyInfo &BFI; +  bool Changed; +  std::vector<MemIntrinsic *> WorkList; +  // Start of the previse range. +  int64_t PreciseRangeStart; +  // Last value of the previse range. +  int64_t PreciseRangeLast; +  // The space to read the profile annotation. +  std::unique_ptr<InstrProfValueData[]> ValueDataArray; +  bool perform(MemIntrinsic *MI); + +  // This kind shows which group the value falls in. For PreciseValue, we have +  // the profile count for that value. LargeGroup groups the values that are in +  // range [LargeValue, +inf). NonLargeGroup groups the rest of values. +  enum MemOPSizeKind { PreciseValue, NonLargeGroup, LargeGroup }; + +  MemOPSizeKind getMemOPSizeKind(int64_t Value) const { +    if (Value == MemOPSizeLarge && MemOPSizeLarge != 0) +      return LargeGroup; +    if (Value == PreciseRangeLast + 1) +      return NonLargeGroup; +    return PreciseValue; +  } +}; + +static const char *getMIName(const MemIntrinsic *MI) { +  switch (MI->getIntrinsicID()) { +  case Intrinsic::memcpy: +    return "memcpy"; +  case Intrinsic::memmove: +    return "memmove"; +  case Intrinsic::memset: +    return "memset"; +  default: +    return "unknown"; +  } +} + +static bool isProfitable(uint64_t Count, uint64_t TotalCount) { +  assert(Count <= TotalCount); +  if (Count < MemOPCountThreshold) +    return false; +  if (Count < TotalCount * MemOPPercentThreshold / 100) +    return false; +  return true; +} + +static inline uint64_t getScaledCount(uint64_t Count, uint64_t Num, +                                      uint64_t Denom) { +  if (!MemOPScaleCount) +    return Count; +  bool Overflowed; +  uint64_t ScaleCount = SaturatingMultiply(Count, Num, &Overflowed); +  return ScaleCount / Denom; +} + +bool MemOPSizeOpt::perform(MemIntrinsic *MI) { +  assert(MI); +  if (MI->getIntrinsicID() == Intrinsic::memmove) +    return false; + +  uint32_t NumVals, MaxNumPromotions = MemOPMaxVersion + 2; +  uint64_t TotalCount; +  if (!getValueProfDataFromInst(*MI, IPVK_MemOPSize, MaxNumPromotions, +                                ValueDataArray.get(), NumVals, TotalCount)) +    return false; + +  uint64_t ActualCount = TotalCount; +  uint64_t SavedTotalCount = TotalCount; +  if (MemOPScaleCount) { +    auto BBEdgeCount = BFI.getBlockProfileCount(MI->getParent()); +    if (!BBEdgeCount) +      return false; +    ActualCount = *BBEdgeCount; +  } + +  if (ActualCount < MemOPCountThreshold) +    return false; + +  ArrayRef<InstrProfValueData> VDs(ValueDataArray.get(), NumVals); +  TotalCount = ActualCount; +  if (MemOPScaleCount) +    DEBUG(dbgs() << "Scale counts: numberator = " << ActualCount +                 << " denominator = " << SavedTotalCount << "\n"); + +  // Keeping track of the count of the default case: +  uint64_t RemainCount = TotalCount; +  SmallVector<uint64_t, 16> SizeIds; +  SmallVector<uint64_t, 16> CaseCounts; +  uint64_t MaxCount = 0; +  unsigned Version = 0; +  // Default case is in the front -- save the slot here. +  CaseCounts.push_back(0); +  for (auto &VD : VDs) { +    int64_t V = VD.Value; +    uint64_t C = VD.Count; +    if (MemOPScaleCount) +      C = getScaledCount(C, ActualCount, SavedTotalCount); + +    // Only care precise value here. +    if (getMemOPSizeKind(V) != PreciseValue) +      continue; + +    // ValueCounts are sorted on the count. Break at the first un-profitable +    // value. +    if (!isProfitable(C, RemainCount)) +      break; + +    SizeIds.push_back(V); +    CaseCounts.push_back(C); +    if (C > MaxCount) +      MaxCount = C; + +    assert(RemainCount >= C); +    RemainCount -= C; + +    if (++Version > MemOPMaxVersion && MemOPMaxVersion != 0) +      break; +  } + +  if (Version == 0) +    return false; + +  CaseCounts[0] = RemainCount; +  if (RemainCount > MaxCount) +    MaxCount = RemainCount; + +  uint64_t SumForOpt = TotalCount - RemainCount; +  DEBUG(dbgs() << "Read one memory intrinsic profile: " << SumForOpt << " vs " +               << TotalCount << "\n"); +  DEBUG( +      for (auto &VD +           : VDs) { dbgs() << "  (" << VD.Value << "," << VD.Count << ")\n"; }); + +  DEBUG(dbgs() << "Optimize one memory intrinsic call to " << Version +               << " Versions\n"); + +  // mem_op(..., size) +  // ==> +  // switch (size) { +  //   case s1: +  //      mem_op(..., s1); +  //      goto merge_bb; +  //   case s2: +  //      mem_op(..., s2); +  //      goto merge_bb; +  //   ... +  //   default: +  //      mem_op(..., size); +  //      goto merge_bb; +  // } +  // merge_bb: + +  BasicBlock *BB = MI->getParent(); +  DEBUG(dbgs() << "\n\n== Basic Block Before ==\n"); +  DEBUG(dbgs() << *BB << "\n"); + +  BasicBlock *DefaultBB = SplitBlock(BB, MI); +  BasicBlock::iterator It(*MI); +  ++It; +  assert(It != DefaultBB->end()); +  BasicBlock *MergeBB = SplitBlock(DefaultBB, &(*It)); +  DefaultBB->setName("MemOP.Default"); +  MergeBB->setName("MemOP.Merge"); + +  auto &Ctx = Func.getContext(); +  IRBuilder<> IRB(BB); +  BB->getTerminator()->eraseFromParent(); +  Value *SizeVar = MI->getLength(); +  SwitchInst *SI = IRB.CreateSwitch(SizeVar, DefaultBB, SizeIds.size()); + +  // Clear the value profile data. +  MI->setMetadata(LLVMContext::MD_prof, nullptr); + +  DEBUG(dbgs() << "\n\n== Basic Block After==\n"); + +  for (uint64_t SizeId : SizeIds) { +    ConstantInt *CaseSizeId = ConstantInt::get(Type::getInt64Ty(Ctx), SizeId); +    BasicBlock *CaseBB = BasicBlock::Create( +        Ctx, Twine("MemOP.Case.") + Twine(SizeId), &Func, DefaultBB); +    Instruction *NewInst = MI->clone(); +    // Fix the argument. +    dyn_cast<MemIntrinsic>(NewInst)->setLength(CaseSizeId); +    CaseBB->getInstList().push_back(NewInst); +    IRBuilder<> IRBCase(CaseBB); +    IRBCase.CreateBr(MergeBB); +    SI->addCase(CaseSizeId, CaseBB); +    DEBUG(dbgs() << *CaseBB << "\n"); +  } +  setProfMetadata(Func.getParent(), SI, CaseCounts, MaxCount); + +  DEBUG(dbgs() << *BB << "\n"); +  DEBUG(dbgs() << *DefaultBB << "\n"); +  DEBUG(dbgs() << *MergeBB << "\n"); + +  emitOptimizationRemark(Func.getContext(), "memop-opt", Func, +                         MI->getDebugLoc(), +                         Twine("optimize ") + getMIName(MI) + " with count " + +                             Twine(SumForOpt) + " out of " + Twine(TotalCount) + +                             " for " + Twine(Version) + " versions"); + +  return true; +} +} // namespace + +static bool PGOMemOPSizeOptImpl(Function &F, BlockFrequencyInfo &BFI) { +  if (DisableMemOPOPT) +    return false; + +  if (F.hasFnAttribute(Attribute::OptimizeForSize)) +    return false; +  MemOPSizeOpt MemOPSizeOpt(F, BFI); +  MemOPSizeOpt.perform(); +  return MemOPSizeOpt.isChanged(); +} + +bool PGOMemOPSizeOptLegacyPass::runOnFunction(Function &F) { +  BlockFrequencyInfo &BFI = +      getAnalysis<BlockFrequencyInfoWrapperPass>().getBFI(); +  return PGOMemOPSizeOptImpl(F, BFI); +} + +namespace llvm { +char &PGOMemOPSizeOptID = PGOMemOPSizeOptLegacyPass::ID; + +PreservedAnalyses PGOMemOPSizeOpt::run(Function &F, +                                       FunctionAnalysisManager &FAM) { +  auto &BFI = FAM.getResult<BlockFrequencyAnalysis>(F); +  bool Changed = PGOMemOPSizeOptImpl(F, BFI); +  if (!Changed) +    return PreservedAnalyses::all(); +  auto  PA = PreservedAnalyses(); +  PA.preserve<GlobalsAA>(); +  return PA; +} +} // namespace llvm diff --git a/lib/Transforms/Instrumentation/InstrProfiling.cpp b/lib/Transforms/Instrumentation/InstrProfiling.cpp index adea7e772447..d91ac6ac7883 100644 --- a/lib/Transforms/Instrumentation/InstrProfiling.cpp +++ b/lib/Transforms/Instrumentation/InstrProfiling.cpp @@ -14,18 +14,58 @@  //===----------------------------------------------------------------------===//  #include "llvm/Transforms/InstrProfiling.h" +#include "llvm/ADT/ArrayRef.h" +#include "llvm/ADT/SmallVector.h" +#include "llvm/ADT/StringRef.h"  #include "llvm/ADT/Triple.h" +#include "llvm/ADT/Twine.h"  #include "llvm/Analysis/TargetLibraryInfo.h" -#include "llvm/IR/IRBuilder.h" +#include "llvm/IR/Attributes.h" +#include "llvm/IR/BasicBlock.h" +#include "llvm/IR/Constant.h" +#include "llvm/IR/Constants.h" +#include "llvm/IR/DerivedTypes.h" +#include "llvm/IR/Function.h" +#include "llvm/IR/GlobalValue.h" +#include "llvm/IR/GlobalVariable.h" +#include "llvm/IR/Instruction.h" +#include "llvm/IR/Instructions.h"  #include "llvm/IR/IntrinsicInst.h" +#include "llvm/IR/IRBuilder.h"  #include "llvm/IR/Module.h" +#include "llvm/IR/Type.h" +#include "llvm/Pass.h"  #include "llvm/ProfileData/InstrProf.h" +#include "llvm/Support/Casting.h" +#include "llvm/Support/CommandLine.h" +#include "llvm/Support/Error.h" +#include "llvm/Support/ErrorHandling.h"  #include "llvm/Transforms/Utils/ModuleUtils.h" +#include <algorithm> +#include <cassert> +#include <cstddef> +#include <cstdint> +#include <string>  using namespace llvm;  #define DEBUG_TYPE "instrprof" +// The start and end values of precise value profile range for memory +// intrinsic sizes +cl::opt<std::string> MemOPSizeRange( +    "memop-size-range", +    cl::desc("Set the range of size in memory intrinsic calls to be profiled " +             "precisely, in a format of <start_val>:<end_val>"), +    cl::init("")); + +// The value that considered to be large value in  memory intrinsic. +cl::opt<unsigned> MemOPSizeLarge( +    "memop-size-large", +    cl::desc("Set large value thresthold in memory intrinsic size profiling. " +             "Value of 0 disables the large value profiling."), +    cl::init(8192)); +  namespace {  cl::opt<bool> DoNameCompression("enable-name-compression", @@ -41,6 +81,7 @@ cl::opt<bool> ValueProfileStaticAlloc(      "vp-static-alloc",      cl::desc("Do static counter allocation for value profiler"),      cl::init(true)); +  cl::opt<double> NumCountersPerValueSite(      "vp-counters-per-site",      cl::desc("The average number of profile counters allocated " @@ -56,9 +97,11 @@ class InstrProfilingLegacyPass : public ModulePass {  public:    static char ID; -  InstrProfilingLegacyPass() : ModulePass(ID), InstrProf() {} + +  InstrProfilingLegacyPass() : ModulePass(ID) {}    InstrProfilingLegacyPass(const InstrProfOptions &Options)        : ModulePass(ID), InstrProf(Options) {} +    StringRef getPassName() const override {      return "Frontend instrumentation-based coverage lowering";    } @@ -73,7 +116,7 @@ public:    }  }; -} // anonymous namespace +} // end anonymous namespace  PreservedAnalyses InstrProfiling::run(Module &M, ModuleAnalysisManager &AM) {    auto &TLI = AM.getResult<TargetLibraryAnalysis>(M); @@ -97,30 +140,6 @@ llvm::createInstrProfilingLegacyPass(const InstrProfOptions &Options) {    return new InstrProfilingLegacyPass(Options);  } -bool InstrProfiling::isMachO() const { -  return Triple(M->getTargetTriple()).isOSBinFormatMachO(); -} - -/// Get the section name for the counter variables. -StringRef InstrProfiling::getCountersSection() const { -  return getInstrProfCountersSectionName(isMachO()); -} - -/// Get the section name for the name variables. -StringRef InstrProfiling::getNameSection() const { -  return getInstrProfNameSectionName(isMachO()); -} - -/// Get the section name for the profile data variables. -StringRef InstrProfiling::getDataSection() const { -  return getInstrProfDataSectionName(isMachO()); -} - -/// Get the section name for the coverage mapping data. -StringRef InstrProfiling::getCoverageSection() const { -  return getInstrProfCoverageSectionName(isMachO()); -} -  static InstrProfIncrementInst *castToIncrementInst(Instruction *Instr) {    InstrProfIncrementInst *Inc = dyn_cast<InstrProfIncrementInstStep>(Instr);    if (Inc) @@ -137,6 +156,9 @@ bool InstrProfiling::run(Module &M, const TargetLibraryInfo &TLI) {    NamesSize = 0;    ProfileDataMap.clear();    UsedVars.clear(); +  getMemOPSizeRangeFromOption(MemOPSizeRange, MemOPSizeRangeStart, +                              MemOPSizeRangeLast); +  TT = Triple(M.getTargetTriple());    // We did not know how many value sites there would be inside    // the instrumented function. This is counting the number of instrumented @@ -189,17 +211,34 @@ bool InstrProfiling::run(Module &M, const TargetLibraryInfo &TLI) {  }  static Constant *getOrInsertValueProfilingCall(Module &M, -                                               const TargetLibraryInfo &TLI) { +                                               const TargetLibraryInfo &TLI, +                                               bool IsRange = false) {    LLVMContext &Ctx = M.getContext();    auto *ReturnTy = Type::getVoidTy(M.getContext()); -  Type *ParamTypes[] = { + +  Constant *Res; +  if (!IsRange) { +    Type *ParamTypes[] = {  #define VALUE_PROF_FUNC_PARAM(ParamType, ParamName, ParamLLVMType) ParamLLVMType  #include "llvm/ProfileData/InstrProfData.inc" -  }; -  auto *ValueProfilingCallTy = -      FunctionType::get(ReturnTy, makeArrayRef(ParamTypes), false); -  Constant *Res = M.getOrInsertFunction(getInstrProfValueProfFuncName(), -                                        ValueProfilingCallTy); +    }; +    auto *ValueProfilingCallTy = +        FunctionType::get(ReturnTy, makeArrayRef(ParamTypes), false); +    Res = M.getOrInsertFunction(getInstrProfValueProfFuncName(), +                                ValueProfilingCallTy); +  } else { +    Type *RangeParamTypes[] = { +#define VALUE_RANGE_PROF 1 +#define VALUE_PROF_FUNC_PARAM(ParamType, ParamName, ParamLLVMType) ParamLLVMType +#include "llvm/ProfileData/InstrProfData.inc" +#undef VALUE_RANGE_PROF +    }; +    auto *ValueRangeProfilingCallTy = +        FunctionType::get(ReturnTy, makeArrayRef(RangeParamTypes), false); +    Res = M.getOrInsertFunction(getInstrProfValueRangeProfFuncName(), +                                ValueRangeProfilingCallTy); +  } +    if (Function *FunRes = dyn_cast<Function>(Res)) {      if (auto AK = TLI.getExtAttrForI32Param(false))        FunRes->addAttribute(3, AK); @@ -208,7 +247,6 @@ static Constant *getOrInsertValueProfilingCall(Module &M,  }  void InstrProfiling::computeNumValueSiteCounts(InstrProfValueProfileInst *Ind) { -    GlobalVariable *Name = Ind->getName();    uint64_t ValueKind = Ind->getValueKind()->getZExtValue();    uint64_t Index = Ind->getIndex()->getZExtValue(); @@ -222,7 +260,6 @@ void InstrProfiling::computeNumValueSiteCounts(InstrProfValueProfileInst *Ind) {  }  void InstrProfiling::lowerValueProfileInst(InstrProfValueProfileInst *Ind) { -    GlobalVariable *Name = Ind->getName();    auto It = ProfileDataMap.find(Name);    assert(It != ProfileDataMap.end() && It->second.DataVar && @@ -235,11 +272,25 @@ void InstrProfiling::lowerValueProfileInst(InstrProfValueProfileInst *Ind) {      Index += It->second.NumValueSites[Kind];    IRBuilder<> Builder(Ind); -  Value *Args[3] = {Ind->getTargetValue(), -                    Builder.CreateBitCast(DataVar, Builder.getInt8PtrTy()), -                    Builder.getInt32(Index)}; -  CallInst *Call = Builder.CreateCall(getOrInsertValueProfilingCall(*M, *TLI), -                                      Args); +  bool IsRange = (Ind->getValueKind()->getZExtValue() == +                  llvm::InstrProfValueKind::IPVK_MemOPSize); +  CallInst *Call = nullptr; +  if (!IsRange) { +    Value *Args[3] = {Ind->getTargetValue(), +                      Builder.CreateBitCast(DataVar, Builder.getInt8PtrTy()), +                      Builder.getInt32(Index)}; +    Call = Builder.CreateCall(getOrInsertValueProfilingCall(*M, *TLI), Args); +  } else { +    Value *Args[6] = { +        Ind->getTargetValue(), +        Builder.CreateBitCast(DataVar, Builder.getInt8PtrTy()), +        Builder.getInt32(Index), +        Builder.getInt64(MemOPSizeRangeStart), +        Builder.getInt64(MemOPSizeRangeLast), +        Builder.getInt64(MemOPSizeLarge == 0 ? INT64_MIN : MemOPSizeLarge)}; +    Call = +        Builder.CreateCall(getOrInsertValueProfilingCall(*M, *TLI, true), Args); +  }    if (auto AK = TLI->getExtAttrForI32Param(false))      Call->addAttribute(3, AK);    Ind->replaceAllUsesWith(Call); @@ -259,7 +310,6 @@ void InstrProfiling::lowerIncrement(InstrProfIncrementInst *Inc) {  }  void InstrProfiling::lowerCoverageData(GlobalVariable *CoverageNamesVar) { -    ConstantArray *Names =        cast<ConstantArray>(CoverageNamesVar->getInitializer());    for (unsigned I = 0, E = Names->getNumOperands(); I < E; ++I) { @@ -270,7 +320,9 @@ void InstrProfiling::lowerCoverageData(GlobalVariable *CoverageNamesVar) {      Name->setLinkage(GlobalValue::PrivateLinkage);      ReferencedNames.push_back(Name); +    NC->dropAllReferences();    } +  CoverageNamesVar->eraseFromParent();  }  /// Get the name of a profiling variable for a particular function. @@ -367,7 +419,8 @@ InstrProfiling::getOrCreateRegionCounters(InstrProfIncrementInst *Inc) {                           Constant::getNullValue(CounterTy),                           getVarName(Inc, getInstrProfCountersVarPrefix()));    CounterPtr->setVisibility(NamePtr->getVisibility()); -  CounterPtr->setSection(getCountersSection()); +  CounterPtr->setSection( +      getInstrProfSectionName(IPSK_cnts, TT.getObjectFormat()));    CounterPtr->setAlignment(8);    CounterPtr->setComdat(ProfileVarsComdat); @@ -376,7 +429,6 @@ InstrProfiling::getOrCreateRegionCounters(InstrProfIncrementInst *Inc) {    // the current function.    Constant *ValuesPtrExpr = ConstantPointerNull::get(Int8PtrTy);    if (ValueProfileStaticAlloc && !needsRuntimeRegistrationOfSectionRange(*M)) { -      uint64_t NS = 0;      for (uint32_t Kind = IPVK_First; Kind <= IPVK_Last; ++Kind)        NS += PD.NumValueSites[Kind]; @@ -388,11 +440,12 @@ InstrProfiling::getOrCreateRegionCounters(InstrProfIncrementInst *Inc) {                               Constant::getNullValue(ValuesTy),                               getVarName(Inc, getInstrProfValuesVarPrefix()));        ValuesVar->setVisibility(NamePtr->getVisibility()); -      ValuesVar->setSection(getInstrProfValuesSectionName(isMachO())); +      ValuesVar->setSection( +          getInstrProfSectionName(IPSK_vals, TT.getObjectFormat()));        ValuesVar->setAlignment(8);        ValuesVar->setComdat(ProfileVarsComdat);        ValuesPtrExpr = -          ConstantExpr::getBitCast(ValuesVar, llvm::Type::getInt8PtrTy(Ctx)); +          ConstantExpr::getBitCast(ValuesVar, Type::getInt8PtrTy(Ctx));      }    } @@ -421,7 +474,7 @@ InstrProfiling::getOrCreateRegionCounters(InstrProfIncrementInst *Inc) {                                    ConstantStruct::get(DataTy, DataVals),                                    getVarName(Inc, getInstrProfDataVarPrefix()));    Data->setVisibility(NamePtr->getVisibility()); -  Data->setSection(getDataSection()); +  Data->setSection(getInstrProfSectionName(IPSK_data, TT.getObjectFormat()));    Data->setAlignment(INSTR_PROF_DATA_ALIGNMENT);    Data->setComdat(ProfileVarsComdat); @@ -481,9 +534,10 @@ void InstrProfiling::emitVNodes() {    ArrayType *VNodesTy = ArrayType::get(VNodeTy, NumCounters);    auto *VNodesVar = new GlobalVariable( -      *M, VNodesTy, false, llvm::GlobalValue::PrivateLinkage, +      *M, VNodesTy, false, GlobalValue::PrivateLinkage,        Constant::getNullValue(VNodesTy), getInstrProfVNodesVarName()); -  VNodesVar->setSection(getInstrProfVNodesSectionName(isMachO())); +  VNodesVar->setSection( +      getInstrProfSectionName(IPSK_vnodes, TT.getObjectFormat()));    UsedVars.push_back(VNodesVar);  } @@ -496,18 +550,22 @@ void InstrProfiling::emitNameData() {    std::string CompressedNameStr;    if (Error E = collectPGOFuncNameStrings(ReferencedNames, CompressedNameStr,                                            DoNameCompression)) { -    llvm::report_fatal_error(toString(std::move(E)), false); +    report_fatal_error(toString(std::move(E)), false);    }    auto &Ctx = M->getContext(); -  auto *NamesVal = llvm::ConstantDataArray::getString( +  auto *NamesVal = ConstantDataArray::getString(        Ctx, StringRef(CompressedNameStr), false); -  NamesVar = new llvm::GlobalVariable(*M, NamesVal->getType(), true, -                                      llvm::GlobalValue::PrivateLinkage, -                                      NamesVal, getInstrProfNamesVarName()); +  NamesVar = new GlobalVariable(*M, NamesVal->getType(), true, +                                GlobalValue::PrivateLinkage, NamesVal, +                                getInstrProfNamesVarName());    NamesSize = CompressedNameStr.size(); -  NamesVar->setSection(getNameSection()); +  NamesVar->setSection( +      getInstrProfSectionName(IPSK_name, TT.getObjectFormat()));    UsedVars.push_back(NamesVar); + +  for (auto *NamePtr : ReferencedNames) +    NamePtr->eraseFromParent();  }  void InstrProfiling::emitRegistration() { @@ -550,7 +608,6 @@ void InstrProfiling::emitRegistration() {  }  void InstrProfiling::emitRuntimeHook() { -    // We expect the linker to be invoked with -u<hook_var> flag for linux,    // for which case there is no need to emit the user function.    if (Triple(M->getTargetTriple()).isOSLinux()) @@ -600,7 +657,6 @@ void InstrProfiling::emitInitialization() {      GlobalVariable *ProfileNameVar = new GlobalVariable(          *M, ProfileNameConst->getType(), true, GlobalValue::WeakAnyLinkage,          ProfileNameConst, INSTR_PROF_QUOTE(INSTR_PROF_PROFILE_NAME_VAR)); -    Triple TT(M->getTargetTriple());      if (TT.supportsCOMDAT()) {        ProfileNameVar->setLinkage(GlobalValue::ExternalLinkage);        ProfileNameVar->setComdat(M->getOrInsertComdat( diff --git a/lib/Transforms/Instrumentation/Instrumentation.cpp b/lib/Transforms/Instrumentation/Instrumentation.cpp index 2963d08752c4..7bb62d2c8455 100644 --- a/lib/Transforms/Instrumentation/Instrumentation.cpp +++ b/lib/Transforms/Instrumentation/Instrumentation.cpp @@ -63,6 +63,7 @@ void llvm::initializeInstrumentation(PassRegistry &Registry) {    initializePGOInstrumentationGenLegacyPassPass(Registry);    initializePGOInstrumentationUseLegacyPassPass(Registry);    initializePGOIndirectCallPromotionLegacyPassPass(Registry); +  initializePGOMemOPSizeOptLegacyPassPass(Registry);    initializeInstrProfilingLegacyPassPass(Registry);    initializeMemorySanitizerPass(Registry);    initializeThreadSanitizerPass(Registry); diff --git a/lib/Transforms/Instrumentation/MemorySanitizer.cpp b/lib/Transforms/Instrumentation/MemorySanitizer.cpp index fafb0fcbd017..190f05db4b0c 100644 --- a/lib/Transforms/Instrumentation/MemorySanitizer.cpp +++ b/lib/Transforms/Instrumentation/MemorySanitizer.cpp @@ -425,7 +425,7 @@ void MemorySanitizer::initializeCallbacks(Module &M) {    // which is not yet implemented.    StringRef WarningFnName = Recover ? "__msan_warning"                                      : "__msan_warning_noreturn"; -  WarningFn = M.getOrInsertFunction(WarningFnName, IRB.getVoidTy(), nullptr); +  WarningFn = M.getOrInsertFunction(WarningFnName, IRB.getVoidTy());    for (size_t AccessSizeIndex = 0; AccessSizeIndex < kNumberOfAccessSizes;         AccessSizeIndex++) { @@ -433,31 +433,31 @@ void MemorySanitizer::initializeCallbacks(Module &M) {      std::string FunctionName = "__msan_maybe_warning_" + itostr(AccessSize);      MaybeWarningFn[AccessSizeIndex] = M.getOrInsertFunction(          FunctionName, IRB.getVoidTy(), IRB.getIntNTy(AccessSize * 8), -        IRB.getInt32Ty(), nullptr); +        IRB.getInt32Ty());      FunctionName = "__msan_maybe_store_origin_" + itostr(AccessSize);      MaybeStoreOriginFn[AccessSizeIndex] = M.getOrInsertFunction(          FunctionName, IRB.getVoidTy(), IRB.getIntNTy(AccessSize * 8), -        IRB.getInt8PtrTy(), IRB.getInt32Ty(), nullptr); +        IRB.getInt8PtrTy(), IRB.getInt32Ty());    }    MsanSetAllocaOrigin4Fn = M.getOrInsertFunction(      "__msan_set_alloca_origin4", IRB.getVoidTy(), IRB.getInt8PtrTy(), IntptrTy, -    IRB.getInt8PtrTy(), IntptrTy, nullptr); +    IRB.getInt8PtrTy(), IntptrTy);    MsanPoisonStackFn =        M.getOrInsertFunction("__msan_poison_stack", IRB.getVoidTy(), -                            IRB.getInt8PtrTy(), IntptrTy, nullptr); +                            IRB.getInt8PtrTy(), IntptrTy);    MsanChainOriginFn = M.getOrInsertFunction( -    "__msan_chain_origin", IRB.getInt32Ty(), IRB.getInt32Ty(), nullptr); +    "__msan_chain_origin", IRB.getInt32Ty(), IRB.getInt32Ty());    MemmoveFn = M.getOrInsertFunction(      "__msan_memmove", IRB.getInt8PtrTy(), IRB.getInt8PtrTy(), -    IRB.getInt8PtrTy(), IntptrTy, nullptr); +    IRB.getInt8PtrTy(), IntptrTy);    MemcpyFn = M.getOrInsertFunction(      "__msan_memcpy", IRB.getInt8PtrTy(), IRB.getInt8PtrTy(), IRB.getInt8PtrTy(), -    IntptrTy, nullptr); +    IntptrTy);    MemsetFn = M.getOrInsertFunction(      "__msan_memset", IRB.getInt8PtrTy(), IRB.getInt8PtrTy(), IRB.getInt32Ty(), -    IntptrTy, nullptr); +    IntptrTy);    // Create globals.    RetvalTLS = new GlobalVariable( @@ -1037,15 +1037,19 @@ struct MemorySanitizerVisitor : public InstVisitor<MemorySanitizerVisitor> {      OriginMap[V] = Origin;    } +  Constant *getCleanShadow(Type *OrigTy) { +    Type *ShadowTy = getShadowTy(OrigTy); +    if (!ShadowTy) +      return nullptr; +    return Constant::getNullValue(ShadowTy); +  } +    /// \brief Create a clean shadow value for a given value.    ///    /// Clean shadow (all zeroes) means all bits of the value are defined    /// (initialized).    Constant *getCleanShadow(Value *V) { -    Type *ShadowTy = getShadowTy(V); -    if (!ShadowTy) -      return nullptr; -    return Constant::getNullValue(ShadowTy); +    return getCleanShadow(V->getType());    }    /// \brief Create a dirty shadow of a given shadow type. @@ -1942,7 +1946,6 @@ struct MemorySanitizerVisitor : public InstVisitor<MemorySanitizerVisitor> {      if (ClCheckAccessAddress)        insertShadowCheck(Addr, &I); -    // FIXME: use ClStoreCleanOrigin      // FIXME: factor out common code from materializeStores      if (MS.TrackOrigins)        IRB.CreateStore(getOrigin(&I, 1), getOriginPtr(Addr, IRB, 1)); @@ -2325,11 +2328,49 @@ struct MemorySanitizerVisitor : public InstVisitor<MemorySanitizerVisitor> {      setOriginForNaryOp(I);    } +  void handleStmxcsr(IntrinsicInst &I) { +    IRBuilder<> IRB(&I); +    Value* Addr = I.getArgOperand(0); +    Type *Ty = IRB.getInt32Ty(); +    Value *ShadowPtr = getShadowPtr(Addr, Ty, IRB); + +    IRB.CreateStore(getCleanShadow(Ty), +                    IRB.CreatePointerCast(ShadowPtr, Ty->getPointerTo())); + +    if (ClCheckAccessAddress) +      insertShadowCheck(Addr, &I); +  } + +  void handleLdmxcsr(IntrinsicInst &I) { +    if (!InsertChecks) return; + +    IRBuilder<> IRB(&I); +    Value *Addr = I.getArgOperand(0); +    Type *Ty = IRB.getInt32Ty(); +    unsigned Alignment = 1; + +    if (ClCheckAccessAddress) +      insertShadowCheck(Addr, &I); + +    Value *Shadow = IRB.CreateAlignedLoad(getShadowPtr(Addr, Ty, IRB), +                                          Alignment, "_ldmxcsr"); +    Value *Origin = MS.TrackOrigins +                        ? IRB.CreateLoad(getOriginPtr(Addr, IRB, Alignment)) +                        : getCleanOrigin(); +    insertShadowCheck(Shadow, Origin, &I); +  } +    void visitIntrinsicInst(IntrinsicInst &I) {      switch (I.getIntrinsicID()) {      case llvm::Intrinsic::bswap:        handleBswap(I);        break; +    case llvm::Intrinsic::x86_sse_stmxcsr: +      handleStmxcsr(I); +      break; +    case llvm::Intrinsic::x86_sse_ldmxcsr: +      handleLdmxcsr(I); +      break;      case llvm::Intrinsic::x86_avx512_vcvtsd2usi64:      case llvm::Intrinsic::x86_avx512_vcvtsd2usi32:      case llvm::Intrinsic::x86_avx512_vcvtss2usi64: @@ -2566,10 +2607,10 @@ struct MemorySanitizerVisitor : public InstVisitor<MemorySanitizerVisitor> {          AttrBuilder B;          B.addAttribute(Attribute::ReadOnly)            .addAttribute(Attribute::ReadNone); -        Func->removeAttributes(AttributeSet::FunctionIndex, -                               AttributeSet::get(Func->getContext(), -                                                 AttributeSet::FunctionIndex, -                                                 B)); +        Func->removeAttributes(AttributeList::FunctionIndex, +                               AttributeList::get(Func->getContext(), +                                                  AttributeList::FunctionIndex, +                                                  B));        }        maybeMarkSanitizerLibraryCallNoBuiltin(Call, TLI); @@ -2597,7 +2638,7 @@ struct MemorySanitizerVisitor : public InstVisitor<MemorySanitizerVisitor> {              " Shadow: " << *ArgShadow << "\n");        bool ArgIsInitialized = false;        const DataLayout &DL = F.getParent()->getDataLayout(); -      if (CS.paramHasAttr(i + 1, Attribute::ByVal)) { +      if (CS.paramHasAttr(i, Attribute::ByVal)) {          assert(A->getType()->isPointerTy() &&                 "ByVal argument is not a pointer!");          Size = DL.getTypeAllocSize(A->getType()->getPointerElementType()); @@ -2690,7 +2731,6 @@ struct MemorySanitizerVisitor : public InstVisitor<MemorySanitizerVisitor> {      } else {        Value *Shadow = getShadow(RetVal);        IRB.CreateAlignedStore(Shadow, ShadowPtr, kShadowTLSAlignment); -      // FIXME: make it conditional if ClStoreCleanOrigin==0        if (MS.TrackOrigins)          IRB.CreateStore(getOrigin(RetVal), getOriginPtrForRetval(IRB));      } @@ -2717,15 +2757,17 @@ struct MemorySanitizerVisitor : public InstVisitor<MemorySanitizerVisitor> {      setOrigin(&I, getCleanOrigin());      IRBuilder<> IRB(I.getNextNode());      const DataLayout &DL = F.getParent()->getDataLayout(); -    uint64_t Size = DL.getTypeAllocSize(I.getAllocatedType()); +    uint64_t TypeSize = DL.getTypeAllocSize(I.getAllocatedType()); +    Value *Len = ConstantInt::get(MS.IntptrTy, TypeSize); +    if (I.isArrayAllocation()) +      Len = IRB.CreateMul(Len, I.getArraySize());      if (PoisonStack && ClPoisonStackWithCall) {        IRB.CreateCall(MS.MsanPoisonStackFn, -                     {IRB.CreatePointerCast(&I, IRB.getInt8PtrTy()), -                      ConstantInt::get(MS.IntptrTy, Size)}); +                     {IRB.CreatePointerCast(&I, IRB.getInt8PtrTy()), Len});      } else {        Value *ShadowBase = getShadowPtr(&I, Type::getInt8PtrTy(*MS.C), IRB);        Value *PoisonValue = IRB.getInt8(PoisonStack ? ClPoisonStackPattern : 0); -      IRB.CreateMemSet(ShadowBase, PoisonValue, Size, I.getAlignment()); +      IRB.CreateMemSet(ShadowBase, PoisonValue, Len, I.getAlignment());      }      if (PoisonStack && MS.TrackOrigins) { @@ -2742,8 +2784,7 @@ struct MemorySanitizerVisitor : public InstVisitor<MemorySanitizerVisitor> {                                                 StackDescription.str());        IRB.CreateCall(MS.MsanSetAllocaOrigin4Fn, -                     {IRB.CreatePointerCast(&I, IRB.getInt8PtrTy()), -                      ConstantInt::get(MS.IntptrTy, Size), +                     {IRB.CreatePointerCast(&I, IRB.getInt8PtrTy()), Len,                        IRB.CreatePointerCast(Descr, IRB.getInt8PtrTy()),                        IRB.CreatePointerCast(&F, MS.IntptrTy)});      } @@ -2935,7 +2976,7 @@ struct VarArgAMD64Helper : public VarArgHelper {        Value *A = *ArgIt;        unsigned ArgNo = CS.getArgumentNo(ArgIt);        bool IsFixed = ArgNo < CS.getFunctionType()->getNumParams(); -      bool IsByVal = CS.paramHasAttr(ArgNo + 1, Attribute::ByVal); +      bool IsByVal = CS.paramHasAttr(ArgNo, Attribute::ByVal);        if (IsByVal) {          // ByVal arguments always go to the overflow area.          // Fixed arguments passed through the overflow area will be stepped @@ -3456,7 +3497,7 @@ struct VarArgPowerPC64Helper : public VarArgHelper {        Value *A = *ArgIt;        unsigned ArgNo = CS.getArgumentNo(ArgIt);        bool IsFixed = ArgNo < CS.getFunctionType()->getNumParams(); -      bool IsByVal = CS.paramHasAttr(ArgNo + 1, Attribute::ByVal); +      bool IsByVal = CS.paramHasAttr(ArgNo, Attribute::ByVal);        if (IsByVal) {          assert(A->getType()->isPointerTy());          Type *RealTy = A->getType()->getPointerElementType(); @@ -3618,9 +3659,9 @@ bool MemorySanitizer::runOnFunction(Function &F) {    AttrBuilder B;    B.addAttribute(Attribute::ReadOnly)      .addAttribute(Attribute::ReadNone); -  F.removeAttributes(AttributeSet::FunctionIndex, -                     AttributeSet::get(F.getContext(), -                                       AttributeSet::FunctionIndex, B)); +  F.removeAttributes( +      AttributeList::FunctionIndex, +      AttributeList::get(F.getContext(), AttributeList::FunctionIndex, B));    return Visitor.runOnFunction();  } diff --git a/lib/Transforms/Instrumentation/PGOInstrumentation.cpp b/lib/Transforms/Instrumentation/PGOInstrumentation.cpp index 04f9a64bef9f..990bcec109de 100644 --- a/lib/Transforms/Instrumentation/PGOInstrumentation.cpp +++ b/lib/Transforms/Instrumentation/PGOInstrumentation.cpp @@ -58,8 +58,10 @@  #include "llvm/Analysis/BranchProbabilityInfo.h"  #include "llvm/Analysis/CFG.h"  #include "llvm/Analysis/IndirectCallSiteVisitor.h" +#include "llvm/Analysis/LoopInfo.h"  #include "llvm/IR/CallSite.h"  #include "llvm/IR/DiagnosticInfo.h" +#include "llvm/IR/Dominators.h"  #include "llvm/IR/GlobalValue.h"  #include "llvm/IR/IRBuilder.h"  #include "llvm/IR/InstIterator.h" @@ -71,7 +73,9 @@  #include "llvm/ProfileData/InstrProfReader.h"  #include "llvm/ProfileData/ProfileCommon.h"  #include "llvm/Support/BranchProbability.h" +#include "llvm/Support/DOTGraphTraits.h"  #include "llvm/Support/Debug.h" +#include "llvm/Support/GraphWriter.h"  #include "llvm/Support/JamCRC.h"  #include "llvm/Transforms/Instrumentation.h"  #include "llvm/Transforms/Utils/BasicBlockUtils.h" @@ -87,6 +91,7 @@ using namespace llvm;  STATISTIC(NumOfPGOInstrument, "Number of edges instrumented.");  STATISTIC(NumOfPGOSelectInsts, "Number of select instruction instrumented."); +STATISTIC(NumOfPGOMemIntrinsics, "Number of mem intrinsics instrumented.");  STATISTIC(NumOfPGOEdge, "Number of edges.");  STATISTIC(NumOfPGOBB, "Number of basic-blocks.");  STATISTIC(NumOfPGOSplit, "Number of critical edge splits."); @@ -116,6 +121,13 @@ static cl::opt<unsigned> MaxNumAnnotations(      cl::desc("Max number of annotations for a single indirect "               "call callsite")); +// Command line option to set the maximum number of value annotations +// to write to the metadata for a single memop intrinsic. +static cl::opt<unsigned> MaxNumMemOPAnnotations( +    "memop-max-annotations", cl::init(4), cl::Hidden, cl::ZeroOrMore, +    cl::desc("Max number of preicise value annotations for a single memop" +             "intrinsic")); +  // Command line option to control appending FunctionHash to the name of a COMDAT  // function. This is to avoid the hash mismatch caused by the preinliner.  static cl::opt<bool> DoComdatRenaming( @@ -125,24 +137,59 @@ static cl::opt<bool> DoComdatRenaming(  // Command line option to enable/disable the warning about missing profile  // information. -static cl::opt<bool> PGOWarnMissing("pgo-warn-missing-function", -                                     cl::init(false), -                                     cl::Hidden); +static cl::opt<bool> +    PGOWarnMissing("pgo-warn-missing-function", cl::init(false), cl::Hidden, +                   cl::desc("Use this option to turn on/off " +                            "warnings about missing profile data for " +                            "functions."));  // Command line option to enable/disable the warning about a hash mismatch in  // the profile data. -static cl::opt<bool> NoPGOWarnMismatch("no-pgo-warn-mismatch", cl::init(false), -                                       cl::Hidden); +static cl::opt<bool> +    NoPGOWarnMismatch("no-pgo-warn-mismatch", cl::init(false), cl::Hidden, +                      cl::desc("Use this option to turn off/on " +                               "warnings about profile cfg mismatch."));  // Command line option to enable/disable the warning about a hash mismatch in  // the profile data for Comdat functions, which often turns out to be false  // positive due to the pre-instrumentation inline. -static cl::opt<bool> NoPGOWarnMismatchComdat("no-pgo-warn-mismatch-comdat", -                                             cl::init(true), cl::Hidden); +static cl::opt<bool> +    NoPGOWarnMismatchComdat("no-pgo-warn-mismatch-comdat", cl::init(true), +                            cl::Hidden, +                            cl::desc("The option is used to turn on/off " +                                     "warnings about hash mismatch for comdat " +                                     "functions."));  // Command line option to enable/disable select instruction instrumentation. -static cl::opt<bool> PGOInstrSelect("pgo-instr-select", cl::init(true), -                                    cl::Hidden); +static cl::opt<bool> +    PGOInstrSelect("pgo-instr-select", cl::init(true), cl::Hidden, +                   cl::desc("Use this option to turn on/off SELECT " +                            "instruction instrumentation. ")); + +// Command line option to turn on CFG dot dump of raw profile counts +static cl::opt<bool> +    PGOViewRawCounts("pgo-view-raw-counts", cl::init(false), cl::Hidden, +                     cl::desc("A boolean option to show CFG dag " +                              "with raw profile counts from " +                              "profile data. See also option " +                              "-pgo-view-counts. To limit graph " +                              "display to only one function, use " +                              "filtering option -view-bfi-func-name.")); + +// Command line option to enable/disable memop intrinsic call.size profiling. +static cl::opt<bool> +    PGOInstrMemOP("pgo-instr-memop", cl::init(true), cl::Hidden, +                  cl::desc("Use this option to turn on/off " +                           "memory instrinsic size profiling.")); + +// Command line option to turn on CFG dot dump after profile annotation. +// Defined in Analysis/BlockFrequencyInfo.cpp:  -pgo-view-counts +extern cl::opt<bool> PGOViewCounts; + +// Command line option to specify the name of the function for CFG dump +// Defined in Analysis/BlockFrequencyInfo.cpp:  -view-bfi-func-name= +extern cl::opt<std::string> ViewBlockFreqFuncName; +  namespace {  /// The select instruction visitor plays three roles specified @@ -167,6 +214,7 @@ struct SelectInstVisitor : public InstVisitor<SelectInstVisitor> {    SelectInstVisitor(Function &Func) : F(Func) {}    void countSelects(Function &Func) { +    NSIs = 0;      Mode = VM_counting;      visit(Func);    } @@ -196,9 +244,54 @@ struct SelectInstVisitor : public InstVisitor<SelectInstVisitor> {    void annotateOneSelectInst(SelectInst &SI);    // Visit \p SI instruction and perform tasks according to visit mode.    void visitSelectInst(SelectInst &SI); +  // Return the number of select instructions. This needs be called after +  // countSelects().    unsigned getNumOfSelectInsts() const { return NSIs; }  }; +/// Instruction Visitor class to visit memory intrinsic calls. +struct MemIntrinsicVisitor : public InstVisitor<MemIntrinsicVisitor> { +  Function &F; +  unsigned NMemIs = 0;          // Number of memIntrinsics instrumented. +  VisitMode Mode = VM_counting; // Visiting mode. +  unsigned CurCtrId = 0;        // Current counter index. +  unsigned TotalNumCtrs = 0;    // Total number of counters +  GlobalVariable *FuncNameVar = nullptr; +  uint64_t FuncHash = 0; +  PGOUseFunc *UseFunc = nullptr; +  std::vector<Instruction *> Candidates; + +  MemIntrinsicVisitor(Function &Func) : F(Func) {} + +  void countMemIntrinsics(Function &Func) { +    NMemIs = 0; +    Mode = VM_counting; +    visit(Func); +  } + +  void instrumentMemIntrinsics(Function &Func, unsigned TotalNC, +                               GlobalVariable *FNV, uint64_t FHash) { +    Mode = VM_instrument; +    TotalNumCtrs = TotalNC; +    FuncHash = FHash; +    FuncNameVar = FNV; +    visit(Func); +  } + +  std::vector<Instruction *> findMemIntrinsics(Function &Func) { +    Candidates.clear(); +    Mode = VM_annotate; +    visit(Func); +    return Candidates; +  } + +  // Visit the IR stream and annotate all mem intrinsic call instructions. +  void instrumentOneMemIntrinsic(MemIntrinsic &MI); +  // Visit \p MI instruction and perform tasks according to visit mode. +  void visitMemIntrinsic(MemIntrinsic &SI); +  unsigned getNumOfMemIntrinsics() const { return NMemIs; } +}; +  class PGOInstrumentationGenLegacyPass : public ModulePass {  public:    static char ID; @@ -316,8 +409,9 @@ private:    std::unordered_multimap<Comdat *, GlobalValue *> &ComdatMembers;  public: -  std::vector<Instruction *> IndirectCallSites; +  std::vector<std::vector<Instruction *>> ValueSites;    SelectInstVisitor SIVisitor; +  MemIntrinsicVisitor MIVisitor;    std::string FuncName;    GlobalVariable *FuncNameVar;    // CFG hash value for this function. @@ -347,13 +441,16 @@ public:        std::unordered_multimap<Comdat *, GlobalValue *> &ComdatMembers,        bool CreateGlobalVar = false, BranchProbabilityInfo *BPI = nullptr,        BlockFrequencyInfo *BFI = nullptr) -      : F(Func), ComdatMembers(ComdatMembers), SIVisitor(Func), FunctionHash(0), -        MST(F, BPI, BFI) { +      : F(Func), ComdatMembers(ComdatMembers), ValueSites(IPVK_Last + 1), +        SIVisitor(Func), MIVisitor(Func), FunctionHash(0), MST(F, BPI, BFI) {      // This should be done before CFG hash computation.      SIVisitor.countSelects(Func); +    MIVisitor.countMemIntrinsics(Func);      NumOfPGOSelectInsts += SIVisitor.getNumOfSelectInsts(); -    IndirectCallSites = findIndirectCallSites(Func); +    NumOfPGOMemIntrinsics += MIVisitor.getNumOfMemIntrinsics(); +    ValueSites[IPVK_IndirectCallTarget] = findIndirectCallSites(Func); +    ValueSites[IPVK_MemOPSize] = MIVisitor.findMemIntrinsics(Func);      FuncName = getPGOFuncName(F);      computeCFGHash(); @@ -405,7 +502,7 @@ void FuncPGOInstrumentation<Edge, BBInfo>::computeCFGHash() {    }    JC.update(Indexes);    FunctionHash = (uint64_t)SIVisitor.getNumOfSelectInsts() << 56 | -                 (uint64_t)IndirectCallSites.size() << 48 | +                 (uint64_t)ValueSites[IPVK_IndirectCallTarget].size() << 48 |                   (uint64_t)MST.AllEdges.size() << 32 | JC.getCRC();  } @@ -552,7 +649,7 @@ static void instrumentOneFunc(      return;    unsigned NumIndirectCallSites = 0; -  for (auto &I : FuncInfo.IndirectCallSites) { +  for (auto &I : FuncInfo.ValueSites[IPVK_IndirectCallTarget]) {      CallSite CS(I);      Value *Callee = CS.getCalledValue();      DEBUG(dbgs() << "Instrument one indirect call: CallSite Index = " @@ -565,10 +662,14 @@ static void instrumentOneFunc(          {llvm::ConstantExpr::getBitCast(FuncInfo.FuncNameVar, I8PtrTy),           Builder.getInt64(FuncInfo.FunctionHash),           Builder.CreatePtrToInt(Callee, Builder.getInt64Ty()), -         Builder.getInt32(llvm::InstrProfValueKind::IPVK_IndirectCallTarget), +         Builder.getInt32(IPVK_IndirectCallTarget),           Builder.getInt32(NumIndirectCallSites++)});    }    NumOfPGOICall += NumIndirectCallSites; + +  // Now instrument memop intrinsic calls. +  FuncInfo.MIVisitor.instrumentMemIntrinsics( +      F, NumCounters, FuncInfo.FuncNameVar, FuncInfo.FunctionHash);  }  // This class represents a CFG edge in profile use compilation. @@ -653,8 +754,11 @@ public:    // Set the branch weights based on the count values.    void setBranchWeights(); -  // Annotate the indirect call sites. -  void annotateIndirectCallSites(); +  // Annotate the value profile call sites all all value kind. +  void annotateValueSites(); + +  // Annotate the value profile call sites for one value kind. +  void annotateValueSites(uint32_t Kind);    // The hotness of the function from the profile count.    enum FuncFreqAttr { FFA_Normal, FFA_Cold, FFA_Hot }; @@ -677,6 +781,8 @@ public:      return FuncInfo.findBBInfo(BB);    } +  Function &getFunc() const { return F; } +  private:    Function &F;    Module *M; @@ -761,7 +867,7 @@ void PGOUseFunc::setInstrumentedCounts(      NewEdge1.InMST = true;      getBBInfo(InstrBB).setBBInfoCount(CountValue);    } -  ProfileCountSize =  CountFromProfile.size(); +  ProfileCountSize = CountFromProfile.size();    CountPosition = I;  } @@ -932,21 +1038,6 @@ void PGOUseFunc::populateCounters() {    DEBUG(FuncInfo.dumpInfo("after reading profile."));  } -static void setProfMetadata(Module *M, Instruction *TI, -                            ArrayRef<uint64_t> EdgeCounts, uint64_t MaxCount) { -  MDBuilder MDB(M->getContext()); -  assert(MaxCount > 0 && "Bad max count"); -  uint64_t Scale = calculateCountScale(MaxCount); -  SmallVector<unsigned, 4> Weights; -  for (const auto &ECI : EdgeCounts) -    Weights.push_back(scaleBranchCount(ECI, Scale)); - -  DEBUG(dbgs() << "Weight is: "; -        for (const auto &W : Weights) { dbgs() << W << " "; }  -        dbgs() << "\n";); -  TI->setMetadata(llvm::LLVMContext::MD_prof, MDB.createBranchWeights(Weights)); -} -  // Assign the scaled count values to the BB with multiple out edges.  void PGOUseFunc::setBranchWeights() {    // Generate MD_prof metadata for every branch instruction. @@ -990,8 +1081,8 @@ void SelectInstVisitor::instrumentOneSelectInst(SelectInst &SI) {    Builder.CreateCall(        Intrinsic::getDeclaration(M, Intrinsic::instrprof_increment_step),        {llvm::ConstantExpr::getBitCast(FuncNameVar, I8PtrTy), -       Builder.getInt64(FuncHash), -       Builder.getInt32(TotalNumCtrs), Builder.getInt32(*CurCtrIdx), Step}); +       Builder.getInt64(FuncHash), Builder.getInt32(TotalNumCtrs), +       Builder.getInt32(*CurCtrIdx), Step});    ++(*CurCtrIdx);  } @@ -1020,9 +1111,9 @@ void SelectInstVisitor::visitSelectInst(SelectInst &SI) {    if (SI.getCondition()->getType()->isVectorTy())      return; -  NSIs++;    switch (Mode) {    case VM_counting: +    NSIs++;      return;    case VM_instrument:      instrumentOneSelectInst(SI); @@ -1035,35 +1126,79 @@ void SelectInstVisitor::visitSelectInst(SelectInst &SI) {    llvm_unreachable("Unknown visiting mode");  } -// Traverse all the indirect callsites and annotate the instructions. -void PGOUseFunc::annotateIndirectCallSites() { +void MemIntrinsicVisitor::instrumentOneMemIntrinsic(MemIntrinsic &MI) { +  Module *M = F.getParent(); +  IRBuilder<> Builder(&MI); +  Type *Int64Ty = Builder.getInt64Ty(); +  Type *I8PtrTy = Builder.getInt8PtrTy(); +  Value *Length = MI.getLength(); +  assert(!dyn_cast<ConstantInt>(Length)); +  Builder.CreateCall( +      Intrinsic::getDeclaration(M, Intrinsic::instrprof_value_profile), +      {llvm::ConstantExpr::getBitCast(FuncNameVar, I8PtrTy), +       Builder.getInt64(FuncHash), Builder.CreatePtrToInt(Length, Int64Ty), +       Builder.getInt32(IPVK_MemOPSize), Builder.getInt32(CurCtrId)}); +  ++CurCtrId; +} + +void MemIntrinsicVisitor::visitMemIntrinsic(MemIntrinsic &MI) { +  if (!PGOInstrMemOP) +    return; +  Value *Length = MI.getLength(); +  // Not instrument constant length calls. +  if (dyn_cast<ConstantInt>(Length)) +    return; + +  switch (Mode) { +  case VM_counting: +    NMemIs++; +    return; +  case VM_instrument: +    instrumentOneMemIntrinsic(MI); +    return; +  case VM_annotate: +    Candidates.push_back(&MI); +    return; +  } +  llvm_unreachable("Unknown visiting mode"); +} + +// Traverse all valuesites and annotate the instructions for all value kind. +void PGOUseFunc::annotateValueSites() {    if (DisableValueProfiling)      return;    // Create the PGOFuncName meta data.    createPGOFuncNameMetadata(F, FuncInfo.FuncName); -  unsigned IndirectCallSiteIndex = 0; -  auto &IndirectCallSites = FuncInfo.IndirectCallSites; -  unsigned NumValueSites = -      ProfileRecord.getNumValueSites(IPVK_IndirectCallTarget); -  if (NumValueSites != IndirectCallSites.size()) { -    std::string Msg = -        std::string("Inconsistent number of indirect call sites: ") + -        F.getName().str(); +  for (uint32_t Kind = IPVK_First; Kind <= IPVK_Last; ++Kind) +    annotateValueSites(Kind); +} + +// Annotate the instructions for a specific value kind. +void PGOUseFunc::annotateValueSites(uint32_t Kind) { +  unsigned ValueSiteIndex = 0; +  auto &ValueSites = FuncInfo.ValueSites[Kind]; +  unsigned NumValueSites = ProfileRecord.getNumValueSites(Kind); +  if (NumValueSites != ValueSites.size()) {      auto &Ctx = M->getContext(); -    Ctx.diagnose( -        DiagnosticInfoPGOProfile(M->getName().data(), Msg, DS_Warning)); +    Ctx.diagnose(DiagnosticInfoPGOProfile( +        M->getName().data(), +        Twine("Inconsistent number of value sites for kind = ") + Twine(Kind) + +            " in " + F.getName().str(), +        DS_Warning));      return;    } -  for (auto &I : IndirectCallSites) { -    DEBUG(dbgs() << "Read one indirect call instrumentation: Index=" -                 << IndirectCallSiteIndex << " out of " << NumValueSites -                 << "\n"); -    annotateValueSite(*M, *I, ProfileRecord, IPVK_IndirectCallTarget, -                      IndirectCallSiteIndex, MaxNumAnnotations); -    IndirectCallSiteIndex++; +  for (auto &I : ValueSites) { +    DEBUG(dbgs() << "Read one value site profile (kind = " << Kind +                 << "): Index = " << ValueSiteIndex << " out of " +                 << NumValueSites << "\n"); +    annotateValueSite(*M, *I, ProfileRecord, +                      static_cast<InstrProfValueKind>(Kind), ValueSiteIndex, +                      Kind == IPVK_MemOPSize ? MaxNumMemOPAnnotations +                                             : MaxNumAnnotations); +    ValueSiteIndex++;    }  }  } // end anonymous namespace @@ -1196,12 +1331,29 @@ static bool annotateAllFunctions(        continue;      Func.populateCounters();      Func.setBranchWeights(); -    Func.annotateIndirectCallSites(); +    Func.annotateValueSites();      PGOUseFunc::FuncFreqAttr FreqAttr = Func.getFuncFreqAttr();      if (FreqAttr == PGOUseFunc::FFA_Cold)        ColdFunctions.push_back(&F);      else if (FreqAttr == PGOUseFunc::FFA_Hot)        HotFunctions.push_back(&F); +    if (PGOViewCounts && (ViewBlockFreqFuncName.empty() || +                          F.getName().equals(ViewBlockFreqFuncName))) { +      LoopInfo LI{DominatorTree(F)}; +      std::unique_ptr<BranchProbabilityInfo> NewBPI = +          llvm::make_unique<BranchProbabilityInfo>(F, LI); +      std::unique_ptr<BlockFrequencyInfo> NewBFI = +          llvm::make_unique<BlockFrequencyInfo>(F, *NewBPI, LI); + +      NewBFI->view(); +    } +    if (PGOViewRawCounts && (ViewBlockFreqFuncName.empty() || +                             F.getName().equals(ViewBlockFreqFuncName))) { +      if (ViewBlockFreqFuncName.empty()) +        WriteGraph(&Func, Twine("PGORawCounts_") + Func.getFunc().getName()); +      else +        ViewGraph(&Func, Twine("PGORawCounts_") + Func.getFunc().getName()); +    }    }    M.setProfileSummary(PGOReader->getSummary().getMD(M.getContext()));    // Set function hotness attribute from the profile. @@ -1257,3 +1409,90 @@ bool PGOInstrumentationUseLegacyPass::runOnModule(Module &M) {    return annotateAllFunctions(M, ProfileFileName, LookupBPI, LookupBFI);  } + +namespace llvm { +void setProfMetadata(Module *M, Instruction *TI, ArrayRef<uint64_t> EdgeCounts, +                     uint64_t MaxCount) { +  MDBuilder MDB(M->getContext()); +  assert(MaxCount > 0 && "Bad max count"); +  uint64_t Scale = calculateCountScale(MaxCount); +  SmallVector<unsigned, 4> Weights; +  for (const auto &ECI : EdgeCounts) +    Weights.push_back(scaleBranchCount(ECI, Scale)); + +  DEBUG(dbgs() << "Weight is: "; +        for (const auto &W : Weights) { dbgs() << W << " "; } +        dbgs() << "\n";); +  TI->setMetadata(llvm::LLVMContext::MD_prof, MDB.createBranchWeights(Weights)); +} + +template <> struct GraphTraits<PGOUseFunc *> { +  typedef const BasicBlock *NodeRef; +  typedef succ_const_iterator ChildIteratorType; +  typedef pointer_iterator<Function::const_iterator> nodes_iterator; + +  static NodeRef getEntryNode(const PGOUseFunc *G) { +    return &G->getFunc().front(); +  } +  static ChildIteratorType child_begin(const NodeRef N) { +    return succ_begin(N); +  } +  static ChildIteratorType child_end(const NodeRef N) { return succ_end(N); } +  static nodes_iterator nodes_begin(const PGOUseFunc *G) { +    return nodes_iterator(G->getFunc().begin()); +  } +  static nodes_iterator nodes_end(const PGOUseFunc *G) { +    return nodes_iterator(G->getFunc().end()); +  } +}; + +static std::string getSimpleNodeName(const BasicBlock *Node) { +  if (!Node->getName().empty()) +    return Node->getName(); + +  std::string SimpleNodeName; +  raw_string_ostream OS(SimpleNodeName); +  Node->printAsOperand(OS, false); +  return OS.str(); +} + +template <> struct DOTGraphTraits<PGOUseFunc *> : DefaultDOTGraphTraits { +  explicit DOTGraphTraits(bool isSimple = false) +      : DefaultDOTGraphTraits(isSimple) {} + +  static std::string getGraphName(const PGOUseFunc *G) { +    return G->getFunc().getName(); +  } + +  std::string getNodeLabel(const BasicBlock *Node, const PGOUseFunc *Graph) { +    std::string Result; +    raw_string_ostream OS(Result); + +    OS << getSimpleNodeName(Node) << ":\\l"; +    UseBBInfo *BI = Graph->findBBInfo(Node); +    OS << "Count : "; +    if (BI && BI->CountValid) +      OS << BI->CountValue << "\\l"; +    else +      OS << "Unknown\\l"; + +    if (!PGOInstrSelect) +      return Result; + +    for (auto BI = Node->begin(); BI != Node->end(); ++BI) { +      auto *I = &*BI; +      if (!isa<SelectInst>(I)) +        continue; +      // Display scaled counts for SELECT instruction: +      OS << "SELECT : { T = "; +      uint64_t TC, FC; +      bool HasProf = I->extractProfMetadata(TC, FC); +      if (!HasProf) +        OS << "Unknown, F = Unknown }\\l"; +      else +        OS << TC << ", F = " << FC << " }\\l"; +    } +    return Result; +  } +}; +} // namespace llvm diff --git a/lib/Transforms/Instrumentation/SanitizerCoverage.cpp b/lib/Transforms/Instrumentation/SanitizerCoverage.cpp index 5b4b1fb77134..fa0c7cc5a4c5 100644 --- a/lib/Transforms/Instrumentation/SanitizerCoverage.cpp +++ b/lib/Transforms/Instrumentation/SanitizerCoverage.cpp @@ -78,7 +78,6 @@ static const char *const SanCovTraceSwitchName = "__sanitizer_cov_trace_switch";  static const char *const SanCovModuleCtorName = "sancov.module_ctor";  static const uint64_t SanCtorAndDtorPriority = 2; -static const char *const SanCovTracePCGuardSection = "__sancov_guards";  static const char *const SanCovTracePCGuardName =      "__sanitizer_cov_trace_pc_guard";  static const char *const SanCovTracePCGuardInitName = @@ -95,7 +94,7 @@ static cl::opt<unsigned> ClCoverageBlockThreshold(      "sanitizer-coverage-block-threshold",      cl::desc("Use a callback with a guard check inside it if there are"               " more than this number of blocks."), -    cl::Hidden, cl::init(500)); +    cl::Hidden, cl::init(0));  static cl::opt<bool>      ClExperimentalTracing("sanitizer-coverage-experimental-tracing", @@ -216,6 +215,9 @@ private:             SanCovWithCheckFunction->getNumUses() + SanCovTraceBB->getNumUses() +             SanCovTraceEnter->getNumUses();    } +  StringRef getSanCovTracePCGuardSection() const; +  StringRef getSanCovTracePCGuardSectionStart() const; +  StringRef getSanCovTracePCGuardSectionEnd() const;    Function *SanCovFunction;    Function *SanCovWithCheckFunction;    Function *SanCovIndirCallFunction, *SanCovTracePCIndir; @@ -227,6 +229,7 @@ private:    InlineAsm *EmptyAsm;    Type *IntptrTy, *IntptrPtrTy, *Int64Ty, *Int64PtrTy, *Int32Ty, *Int32PtrTy;    Module *CurModule; +  Triple TargetTriple;    LLVMContext *C;    const DataLayout *DL; @@ -246,6 +249,7 @@ bool SanitizerCoverageModule::runOnModule(Module &M) {    C = &(M.getContext());    DL = &M.getDataLayout();    CurModule = &M; +  TargetTriple = Triple(M.getTargetTriple());    HasSancovGuardsSection = false;    IntptrTy = Type::getIntNTy(*C, DL->getPointerSizeInBits());    IntptrPtrTy = PointerType::getUnqual(IntptrTy); @@ -258,39 +262,39 @@ bool SanitizerCoverageModule::runOnModule(Module &M) {    Int32Ty = IRB.getInt32Ty();    SanCovFunction = checkSanitizerInterfaceFunction( -      M.getOrInsertFunction(SanCovName, VoidTy, Int32PtrTy, nullptr)); +      M.getOrInsertFunction(SanCovName, VoidTy, Int32PtrTy));    SanCovWithCheckFunction = checkSanitizerInterfaceFunction( -      M.getOrInsertFunction(SanCovWithCheckName, VoidTy, Int32PtrTy, nullptr)); +      M.getOrInsertFunction(SanCovWithCheckName, VoidTy, Int32PtrTy));    SanCovTracePCIndir = checkSanitizerInterfaceFunction( -      M.getOrInsertFunction(SanCovTracePCIndirName, VoidTy, IntptrTy, nullptr)); +      M.getOrInsertFunction(SanCovTracePCIndirName, VoidTy, IntptrTy));    SanCovIndirCallFunction =        checkSanitizerInterfaceFunction(M.getOrInsertFunction( -          SanCovIndirCallName, VoidTy, IntptrTy, IntptrTy, nullptr)); +          SanCovIndirCallName, VoidTy, IntptrTy, IntptrTy));    SanCovTraceCmpFunction[0] =        checkSanitizerInterfaceFunction(M.getOrInsertFunction( -          SanCovTraceCmp1, VoidTy, IRB.getInt8Ty(), IRB.getInt8Ty(), nullptr)); +          SanCovTraceCmp1, VoidTy, IRB.getInt8Ty(), IRB.getInt8Ty()));    SanCovTraceCmpFunction[1] = checkSanitizerInterfaceFunction(        M.getOrInsertFunction(SanCovTraceCmp2, VoidTy, IRB.getInt16Ty(), -                            IRB.getInt16Ty(), nullptr)); +                            IRB.getInt16Ty()));    SanCovTraceCmpFunction[2] = checkSanitizerInterfaceFunction(        M.getOrInsertFunction(SanCovTraceCmp4, VoidTy, IRB.getInt32Ty(), -                            IRB.getInt32Ty(), nullptr)); +                            IRB.getInt32Ty()));    SanCovTraceCmpFunction[3] =        checkSanitizerInterfaceFunction(M.getOrInsertFunction( -          SanCovTraceCmp8, VoidTy, Int64Ty, Int64Ty, nullptr)); +          SanCovTraceCmp8, VoidTy, Int64Ty, Int64Ty));    SanCovTraceDivFunction[0] =        checkSanitizerInterfaceFunction(M.getOrInsertFunction( -          SanCovTraceDiv4, VoidTy, IRB.getInt32Ty(), nullptr)); +          SanCovTraceDiv4, VoidTy, IRB.getInt32Ty()));    SanCovTraceDivFunction[1] =        checkSanitizerInterfaceFunction(M.getOrInsertFunction( -          SanCovTraceDiv8, VoidTy, Int64Ty, nullptr)); +          SanCovTraceDiv8, VoidTy, Int64Ty));    SanCovTraceGepFunction =        checkSanitizerInterfaceFunction(M.getOrInsertFunction( -          SanCovTraceGep, VoidTy, IntptrTy, nullptr)); +          SanCovTraceGep, VoidTy, IntptrTy));    SanCovTraceSwitchFunction =        checkSanitizerInterfaceFunction(M.getOrInsertFunction( -          SanCovTraceSwitchName, VoidTy, Int64Ty, Int64PtrTy, nullptr)); +          SanCovTraceSwitchName, VoidTy, Int64Ty, Int64PtrTy));    // We insert an empty inline asm after cov callbacks to avoid callback merge.    EmptyAsm = InlineAsm::get(FunctionType::get(IRB.getVoidTy(), false), @@ -298,13 +302,13 @@ bool SanitizerCoverageModule::runOnModule(Module &M) {                              /*hasSideEffects=*/true);    SanCovTracePC = checkSanitizerInterfaceFunction( -      M.getOrInsertFunction(SanCovTracePCName, VoidTy, nullptr)); +      M.getOrInsertFunction(SanCovTracePCName, VoidTy));    SanCovTracePCGuard = checkSanitizerInterfaceFunction(M.getOrInsertFunction( -      SanCovTracePCGuardName, VoidTy, Int32PtrTy, nullptr)); +      SanCovTracePCGuardName, VoidTy, Int32PtrTy));    SanCovTraceEnter = checkSanitizerInterfaceFunction( -      M.getOrInsertFunction(SanCovTraceEnterName, VoidTy, Int32PtrTy, nullptr)); +      M.getOrInsertFunction(SanCovTraceEnterName, VoidTy, Int32PtrTy));    SanCovTraceBB = checkSanitizerInterfaceFunction( -      M.getOrInsertFunction(SanCovTraceBBName, VoidTy, Int32PtrTy, nullptr)); +      M.getOrInsertFunction(SanCovTraceBBName, VoidTy, Int32PtrTy));    // At this point we create a dummy array of guards because we don't    // know how many elements we will need. @@ -363,22 +367,28 @@ bool SanitizerCoverageModule::runOnModule(Module &M) {    if (Options.TracePCGuard) {      if (HasSancovGuardsSection) {        Function *CtorFunc; -      std::string SectionName(SanCovTracePCGuardSection); -      GlobalVariable *Bounds[2]; -      const char *Prefix[2] = {"__start_", "__stop_"}; -      for (int i = 0; i < 2; i++) { -        Bounds[i] = new GlobalVariable(M, Int32PtrTy, false, -                                       GlobalVariable::ExternalLinkage, nullptr, -                                       Prefix[i] + SectionName); -        Bounds[i]->setVisibility(GlobalValue::HiddenVisibility); -      } +      GlobalVariable *SecStart = new GlobalVariable( +          M, Int32PtrTy, false, GlobalVariable::ExternalLinkage, nullptr, +          getSanCovTracePCGuardSectionStart()); +      SecStart->setVisibility(GlobalValue::HiddenVisibility); +      GlobalVariable *SecEnd = new GlobalVariable( +          M, Int32PtrTy, false, GlobalVariable::ExternalLinkage, nullptr, +          getSanCovTracePCGuardSectionEnd()); +      SecEnd->setVisibility(GlobalValue::HiddenVisibility); +        std::tie(CtorFunc, std::ignore) = createSanitizerCtorAndInitFunctions(            M, SanCovModuleCtorName, SanCovTracePCGuardInitName,            {Int32PtrTy, Int32PtrTy}, -          {IRB.CreatePointerCast(Bounds[0], Int32PtrTy), -            IRB.CreatePointerCast(Bounds[1], Int32PtrTy)}); - -      appendToGlobalCtors(M, CtorFunc, SanCtorAndDtorPriority); +          {IRB.CreatePointerCast(SecStart, Int32PtrTy), +            IRB.CreatePointerCast(SecEnd, Int32PtrTy)}); + +      if (TargetTriple.supportsCOMDAT()) { +        // Use comdat to dedup CtorFunc. +        CtorFunc->setComdat(M.getOrInsertComdat(SanCovModuleCtorName)); +        appendToGlobalCtors(M, CtorFunc, SanCtorAndDtorPriority, CtorFunc); +      } else { +        appendToGlobalCtors(M, CtorFunc, SanCtorAndDtorPriority); +      }      }    } else if (!Options.TracePC) {      Function *CtorFunc; @@ -435,6 +445,11 @@ static bool shouldInstrumentBlock(const Function& F, const BasicBlock *BB, const    if (isa<UnreachableInst>(BB->getTerminator()))      return false; +  // Don't insert coverage into blocks without a valid insertion point +  // (catchswitch blocks). +  if (BB->getFirstInsertionPt() == BB->end()) +    return false; +    if (!ClPruneBlocks || &F.getEntryBlock() == BB)      return true; @@ -517,7 +532,7 @@ void SanitizerCoverageModule::CreateFunctionGuardArray(size_t NumGuards,        Constant::getNullValue(ArrayOfInt32Ty), "__sancov_gen_");    if (auto Comdat = F.getComdat())      FunctionGuardArray->setComdat(Comdat); -  FunctionGuardArray->setSection(SanCovTracePCGuardSection); +  FunctionGuardArray->setSection(getSanCovTracePCGuardSection());  }  bool SanitizerCoverageModule::InjectCoverage(Function &F, @@ -755,6 +770,27 @@ void SanitizerCoverageModule::InjectCoverageAtBlock(Function &F, BasicBlock &BB,    }  } +StringRef SanitizerCoverageModule::getSanCovTracePCGuardSection() const { +  if (TargetTriple.getObjectFormat() == Triple::COFF) +    return ".SCOV$M"; +  if (TargetTriple.isOSBinFormatMachO()) +    return "__DATA,__sancov_guards"; +  return "__sancov_guards"; +} + +StringRef SanitizerCoverageModule::getSanCovTracePCGuardSectionStart() const { +  if (TargetTriple.isOSBinFormatMachO()) +    return "\1section$start$__DATA$__sancov_guards"; +  return "__start___sancov_guards"; +} + +StringRef SanitizerCoverageModule::getSanCovTracePCGuardSectionEnd() const { +  if (TargetTriple.isOSBinFormatMachO()) +    return "\1section$end$__DATA$__sancov_guards"; +  return "__stop___sancov_guards"; +} + +  char SanitizerCoverageModule::ID = 0;  INITIALIZE_PASS_BEGIN(SanitizerCoverageModule, "sancov",                        "SanitizerCoverage: TODO." diff --git a/lib/Transforms/Instrumentation/ThreadSanitizer.cpp b/lib/Transforms/Instrumentation/ThreadSanitizer.cpp index 52035c79a4a3..9260217bd5e6 100644 --- a/lib/Transforms/Instrumentation/ThreadSanitizer.cpp +++ b/lib/Transforms/Instrumentation/ThreadSanitizer.cpp @@ -155,17 +155,18 @@ FunctionPass *llvm::createThreadSanitizerPass() {  void ThreadSanitizer::initializeCallbacks(Module &M) {    IRBuilder<> IRB(M.getContext()); -  AttributeSet Attr; -  Attr = Attr.addAttribute(M.getContext(), AttributeSet::FunctionIndex, Attribute::NoUnwind); +  AttributeList Attr; +  Attr = Attr.addAttribute(M.getContext(), AttributeList::FunctionIndex, +                           Attribute::NoUnwind);    // Initialize the callbacks.    TsanFuncEntry = checkSanitizerInterfaceFunction(M.getOrInsertFunction( -      "__tsan_func_entry", Attr, IRB.getVoidTy(), IRB.getInt8PtrTy(), nullptr)); +      "__tsan_func_entry", Attr, IRB.getVoidTy(), IRB.getInt8PtrTy()));    TsanFuncExit = checkSanitizerInterfaceFunction( -      M.getOrInsertFunction("__tsan_func_exit", Attr, IRB.getVoidTy(), nullptr)); +      M.getOrInsertFunction("__tsan_func_exit", Attr, IRB.getVoidTy()));    TsanIgnoreBegin = checkSanitizerInterfaceFunction(M.getOrInsertFunction( -      "__tsan_ignore_thread_begin", Attr, IRB.getVoidTy(), nullptr)); +      "__tsan_ignore_thread_begin", Attr, IRB.getVoidTy()));    TsanIgnoreEnd = checkSanitizerInterfaceFunction(M.getOrInsertFunction( -      "__tsan_ignore_thread_end", Attr, IRB.getVoidTy(), nullptr)); +      "__tsan_ignore_thread_end", Attr, IRB.getVoidTy()));    OrdTy = IRB.getInt32Ty();    for (size_t i = 0; i < kNumberOfAccessSizes; ++i) {      const unsigned ByteSize = 1U << i; @@ -174,31 +175,31 @@ void ThreadSanitizer::initializeCallbacks(Module &M) {      std::string BitSizeStr = utostr(BitSize);      SmallString<32> ReadName("__tsan_read" + ByteSizeStr);      TsanRead[i] = checkSanitizerInterfaceFunction(M.getOrInsertFunction( -        ReadName, Attr, IRB.getVoidTy(), IRB.getInt8PtrTy(), nullptr)); +        ReadName, Attr, IRB.getVoidTy(), IRB.getInt8PtrTy()));      SmallString<32> WriteName("__tsan_write" + ByteSizeStr);      TsanWrite[i] = checkSanitizerInterfaceFunction(M.getOrInsertFunction( -        WriteName, Attr, IRB.getVoidTy(), IRB.getInt8PtrTy(), nullptr)); +        WriteName, Attr, IRB.getVoidTy(), IRB.getInt8PtrTy()));      SmallString<64> UnalignedReadName("__tsan_unaligned_read" + ByteSizeStr);      TsanUnalignedRead[i] =          checkSanitizerInterfaceFunction(M.getOrInsertFunction( -            UnalignedReadName, Attr, IRB.getVoidTy(), IRB.getInt8PtrTy(), nullptr)); +            UnalignedReadName, Attr, IRB.getVoidTy(), IRB.getInt8PtrTy()));      SmallString<64> UnalignedWriteName("__tsan_unaligned_write" + ByteSizeStr);      TsanUnalignedWrite[i] =          checkSanitizerInterfaceFunction(M.getOrInsertFunction( -            UnalignedWriteName, Attr, IRB.getVoidTy(), IRB.getInt8PtrTy(), nullptr)); +            UnalignedWriteName, Attr, IRB.getVoidTy(), IRB.getInt8PtrTy()));      Type *Ty = Type::getIntNTy(M.getContext(), BitSize);      Type *PtrTy = Ty->getPointerTo();      SmallString<32> AtomicLoadName("__tsan_atomic" + BitSizeStr + "_load");      TsanAtomicLoad[i] = checkSanitizerInterfaceFunction( -        M.getOrInsertFunction(AtomicLoadName, Attr, Ty, PtrTy, OrdTy, nullptr)); +        M.getOrInsertFunction(AtomicLoadName, Attr, Ty, PtrTy, OrdTy));      SmallString<32> AtomicStoreName("__tsan_atomic" + BitSizeStr + "_store");      TsanAtomicStore[i] = checkSanitizerInterfaceFunction(M.getOrInsertFunction( -        AtomicStoreName, Attr, IRB.getVoidTy(), PtrTy, Ty, OrdTy, nullptr)); +        AtomicStoreName, Attr, IRB.getVoidTy(), PtrTy, Ty, OrdTy));      for (int op = AtomicRMWInst::FIRST_BINOP;          op <= AtomicRMWInst::LAST_BINOP; ++op) { @@ -222,33 +223,33 @@ void ThreadSanitizer::initializeCallbacks(Module &M) {          continue;        SmallString<32> RMWName("__tsan_atomic" + itostr(BitSize) + NamePart);        TsanAtomicRMW[op][i] = checkSanitizerInterfaceFunction( -          M.getOrInsertFunction(RMWName, Attr, Ty, PtrTy, Ty, OrdTy, nullptr)); +          M.getOrInsertFunction(RMWName, Attr, Ty, PtrTy, Ty, OrdTy));      }      SmallString<32> AtomicCASName("__tsan_atomic" + BitSizeStr +                                    "_compare_exchange_val");      TsanAtomicCAS[i] = checkSanitizerInterfaceFunction(M.getOrInsertFunction( -        AtomicCASName, Attr, Ty, PtrTy, Ty, Ty, OrdTy, OrdTy, nullptr)); +        AtomicCASName, Attr, Ty, PtrTy, Ty, Ty, OrdTy, OrdTy));    }    TsanVptrUpdate = checkSanitizerInterfaceFunction(        M.getOrInsertFunction("__tsan_vptr_update", Attr, IRB.getVoidTy(), -                            IRB.getInt8PtrTy(), IRB.getInt8PtrTy(), nullptr)); +                            IRB.getInt8PtrTy(), IRB.getInt8PtrTy()));    TsanVptrLoad = checkSanitizerInterfaceFunction(M.getOrInsertFunction( -      "__tsan_vptr_read", Attr, IRB.getVoidTy(), IRB.getInt8PtrTy(), nullptr)); +      "__tsan_vptr_read", Attr, IRB.getVoidTy(), IRB.getInt8PtrTy()));    TsanAtomicThreadFence = checkSanitizerInterfaceFunction(M.getOrInsertFunction( -      "__tsan_atomic_thread_fence", Attr, IRB.getVoidTy(), OrdTy, nullptr)); +      "__tsan_atomic_thread_fence", Attr, IRB.getVoidTy(), OrdTy));    TsanAtomicSignalFence = checkSanitizerInterfaceFunction(M.getOrInsertFunction( -      "__tsan_atomic_signal_fence", Attr, IRB.getVoidTy(), OrdTy, nullptr)); +      "__tsan_atomic_signal_fence", Attr, IRB.getVoidTy(), OrdTy));    MemmoveFn = checkSanitizerInterfaceFunction(        M.getOrInsertFunction("memmove", Attr, IRB.getInt8PtrTy(), IRB.getInt8PtrTy(), -                            IRB.getInt8PtrTy(), IntptrTy, nullptr)); +                            IRB.getInt8PtrTy(), IntptrTy));    MemcpyFn = checkSanitizerInterfaceFunction(        M.getOrInsertFunction("memcpy", Attr, IRB.getInt8PtrTy(), IRB.getInt8PtrTy(), -                            IRB.getInt8PtrTy(), IntptrTy, nullptr)); +                            IRB.getInt8PtrTy(), IntptrTy));    MemsetFn = checkSanitizerInterfaceFunction(        M.getOrInsertFunction("memset", Attr, IRB.getInt8PtrTy(), IRB.getInt8PtrTy(), -                            IRB.getInt32Ty(), IntptrTy, nullptr)); +                            IRB.getInt32Ty(), IntptrTy));  }  bool ThreadSanitizer::doInitialization(Module &M) { @@ -271,7 +272,7 @@ static bool isVtableAccess(Instruction *I) {  // Do not instrument known races/"benign races" that come from compiler  // instrumentatin. The user has no way of suppressing them. -static bool shouldInstrumentReadWriteFromAddress(Value *Addr) { +static bool shouldInstrumentReadWriteFromAddress(const Module *M, Value *Addr) {    // Peel off GEPs and BitCasts.    Addr = Addr->stripInBoundsOffsets(); @@ -279,8 +280,9 @@ static bool shouldInstrumentReadWriteFromAddress(Value *Addr) {      if (GV->hasSection()) {        StringRef SectionName = GV->getSection();        // Check if the global is in the PGO counters section. -      if (SectionName.endswith(getInstrProfCountersSectionName( -            /*AddSegment=*/false))) +      auto OF = Triple(M->getTargetTriple()).getObjectFormat(); +      if (SectionName.endswith( +              getInstrProfSectionName(IPSK_cnts, OF, /*AddSegmentInfo=*/false)))          return false;      } @@ -342,13 +344,13 @@ void ThreadSanitizer::chooseInstructionsToInstrument(    for (Instruction *I : reverse(Local)) {      if (StoreInst *Store = dyn_cast<StoreInst>(I)) {        Value *Addr = Store->getPointerOperand(); -      if (!shouldInstrumentReadWriteFromAddress(Addr)) +      if (!shouldInstrumentReadWriteFromAddress(I->getModule(), Addr))          continue;        WriteTargets.insert(Addr);      } else {        LoadInst *Load = cast<LoadInst>(I);        Value *Addr = Load->getPointerOperand(); -      if (!shouldInstrumentReadWriteFromAddress(Addr)) +      if (!shouldInstrumentReadWriteFromAddress(I->getModule(), Addr))          continue;        if (WriteTargets.count(Addr)) {          // We will write to this temp, so no reason to analyze the read. | 
