1 //===- JMCInstrumenter.cpp - JMC Instrumentation --------------------------===//
2 //
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6 //
7 //===----------------------------------------------------------------------===//
8 //
9 // JMCInstrumenter pass:
10 // - instrument each function with a call to __CheckForDebuggerJustMyCode. The
11 //   sole argument should be defined in .msvcjmc. Each flag is 1 byte initilized
12 //   to 1.
13 // - create the dummy COMDAT function __JustMyCode_Default to prevent linking
14 //   error if __CheckForDebuggerJustMyCode is not available.
15 // - For MSVC:
16 //   add "/alternatename:__CheckForDebuggerJustMyCode=__JustMyCode_Default" to
17 //   "llvm.linker.options"
18 //   For ELF:
19 //   Rename __JustMyCode_Default to __CheckForDebuggerJustMyCode and mark it as
20 //   weak symbol.
21 //===----------------------------------------------------------------------===//
22 
23 #include "llvm/CodeGen/JMCInstrumenter.h"
24 #include "llvm/ADT/SmallString.h"
25 #include "llvm/ADT/StringExtras.h"
26 #include "llvm/CodeGen/Passes.h"
27 #include "llvm/IR/DIBuilder.h"
28 #include "llvm/IR/DebugInfoMetadata.h"
29 #include "llvm/IR/DerivedTypes.h"
30 #include "llvm/IR/Function.h"
31 #include "llvm/IR/Instructions.h"
32 #include "llvm/IR/LLVMContext.h"
33 #include "llvm/IR/Module.h"
34 #include "llvm/IR/Type.h"
35 #include "llvm/InitializePasses.h"
36 #include "llvm/Pass.h"
37 #include "llvm/Support/DJB.h"
38 #include "llvm/Support/Path.h"
39 #include "llvm/Transforms/Utils/ModuleUtils.h"
40 
41 using namespace llvm;
42 
43 #define DEBUG_TYPE "jmc-instrumenter"
44 
45 static bool runImpl(Module &M);
46 namespace {
47 struct JMCInstrumenter : public ModulePass {
48   static char ID;
JMCInstrumenter__anon8384c81e0111::JMCInstrumenter49   JMCInstrumenter() : ModulePass(ID) {
50     initializeJMCInstrumenterPass(*PassRegistry::getPassRegistry());
51   }
runOnModule__anon8384c81e0111::JMCInstrumenter52   bool runOnModule(Module &M) override { return runImpl(M); }
53 };
54 char JMCInstrumenter::ID = 0;
55 } // namespace
56 
run(Module & M,ModuleAnalysisManager &)57 PreservedAnalyses JMCInstrumenterPass::run(Module &M, ModuleAnalysisManager &) {
58   bool Changed = runImpl(M);
59   return Changed ? PreservedAnalyses::none() : PreservedAnalyses::all();
60 }
61 
62 INITIALIZE_PASS(
63     JMCInstrumenter, DEBUG_TYPE,
64     "Instrument function entry with call to __CheckForDebuggerJustMyCode",
65     false, false)
66 
createJMCInstrumenterPass()67 ModulePass *llvm::createJMCInstrumenterPass() { return new JMCInstrumenter(); }
68 
69 namespace {
70 const char CheckFunctionName[] = "__CheckForDebuggerJustMyCode";
71 
getFlagName(DISubprogram & SP,bool UseX86FastCall)72 std::string getFlagName(DISubprogram &SP, bool UseX86FastCall) {
73   // absolute windows path:           windows_backslash
74   // relative windows backslash path: windows_backslash
75   // relative windows slash path:     posix
76   // absolute posix path:             posix
77   // relative posix path:             posix
78   sys::path::Style PathStyle =
79       has_root_name(SP.getDirectory(), sys::path::Style::windows_backslash) ||
80               SP.getDirectory().contains("\\") ||
81               SP.getFilename().contains("\\")
82           ? sys::path::Style::windows_backslash
83           : sys::path::Style::posix;
84   // Best effort path normalization. This is to guarantee an unique flag symbol
85   // is produced for the same directory. Some builds may want to use relative
86   // paths, or paths with a specific prefix (see the -fdebug-compilation-dir
87   // flag), so only hash paths in debuginfo. Don't expand them to absolute
88   // paths.
89   SmallString<256> FilePath(SP.getDirectory());
90   sys::path::append(FilePath, PathStyle, SP.getFilename());
91   sys::path::native(FilePath, PathStyle);
92   sys::path::remove_dots(FilePath, /*remove_dot_dot=*/true, PathStyle);
93 
94   // The naming convention for the flag name is __<hash>_<file name> with '.' in
95   // <file name> replaced with '@'. For example C:\file.any.c would have a flag
96   // __D032E919_file@any@c. The naming convention match MSVC's format however
97   // the match is not required to make JMC work. The hashing function used here
98   // is different from MSVC's.
99 
100   std::string Suffix;
101   for (auto C : sys::path::filename(FilePath, PathStyle))
102     Suffix.push_back(C == '.' ? '@' : C);
103 
104   sys::path::remove_filename(FilePath, PathStyle);
105   return (UseX86FastCall ? "_" : "__") +
106          utohexstr(djbHash(FilePath), /*LowerCase=*/false,
107                    /*Width=*/8) +
108          "_" + Suffix;
109 }
110 
attachDebugInfo(GlobalVariable & GV,DISubprogram & SP)111 void attachDebugInfo(GlobalVariable &GV, DISubprogram &SP) {
112   Module &M = *GV.getParent();
113   DICompileUnit *CU = SP.getUnit();
114   assert(CU);
115   DIBuilder DB(M, false, CU);
116 
117   auto *DType =
118       DB.createBasicType("unsigned char", 8, dwarf::DW_ATE_unsigned_char,
119                          llvm::DINode::FlagArtificial);
120 
121   auto *DGVE = DB.createGlobalVariableExpression(
122       CU, GV.getName(), /*LinkageName=*/StringRef(), SP.getFile(),
123       /*LineNo=*/0, DType, /*IsLocalToUnit=*/true, /*IsDefined=*/true);
124   GV.addMetadata(LLVMContext::MD_dbg, *DGVE);
125   DB.finalize();
126 }
127 
getCheckFunctionType(LLVMContext & Ctx)128 FunctionType *getCheckFunctionType(LLVMContext &Ctx) {
129   Type *VoidTy = Type::getVoidTy(Ctx);
130   PointerType *VoidPtrTy = PointerType::getUnqual(Ctx);
131   return FunctionType::get(VoidTy, VoidPtrTy, false);
132 }
133 
createDefaultCheckFunction(Module & M,bool UseX86FastCall)134 Function *createDefaultCheckFunction(Module &M, bool UseX86FastCall) {
135   LLVMContext &Ctx = M.getContext();
136   const char *DefaultCheckFunctionName =
137       UseX86FastCall ? "_JustMyCode_Default" : "__JustMyCode_Default";
138   // Create the function.
139   Function *DefaultCheckFunc =
140       Function::Create(getCheckFunctionType(Ctx), GlobalValue::ExternalLinkage,
141                        DefaultCheckFunctionName, &M);
142   DefaultCheckFunc->setUnnamedAddr(GlobalValue::UnnamedAddr::Global);
143   DefaultCheckFunc->addParamAttr(0, Attribute::NoUndef);
144   if (UseX86FastCall)
145     DefaultCheckFunc->addParamAttr(0, Attribute::InReg);
146 
147   BasicBlock *EntryBB = BasicBlock::Create(Ctx, "", DefaultCheckFunc);
148   ReturnInst::Create(Ctx, EntryBB);
149   return DefaultCheckFunc;
150 }
151 } // namespace
152 
runImpl(Module & M)153 bool runImpl(Module &M) {
154   bool Changed = false;
155   LLVMContext &Ctx = M.getContext();
156   Triple ModuleTriple(M.getTargetTriple());
157   bool IsMSVC = ModuleTriple.isKnownWindowsMSVCEnvironment();
158   bool IsELF = ModuleTriple.isOSBinFormatELF();
159   assert((IsELF || IsMSVC) && "Unsupported triple for JMC");
160   bool UseX86FastCall = IsMSVC && ModuleTriple.getArch() == Triple::x86;
161   const char *const FlagSymbolSection = IsELF ? ".data.just.my.code" : ".msvcjmc";
162 
163   GlobalValue *CheckFunction = nullptr;
164   DenseMap<DISubprogram *, Constant *> SavedFlags(8);
165   for (auto &F : M) {
166     if (F.isDeclaration())
167       continue;
168     auto *SP = F.getSubprogram();
169     if (!SP)
170       continue;
171 
172     Constant *&Flag = SavedFlags[SP];
173     if (!Flag) {
174       std::string FlagName = getFlagName(*SP, UseX86FastCall);
175       IntegerType *FlagTy = Type::getInt8Ty(Ctx);
176       Flag = M.getOrInsertGlobal(FlagName, FlagTy, [&] {
177         // FIXME: Put the GV in comdat and have linkonce_odr linkage to save
178         //        .msvcjmc section space? maybe not worth it.
179         GlobalVariable *GV = new GlobalVariable(
180             M, FlagTy, /*isConstant=*/false, GlobalValue::InternalLinkage,
181             ConstantInt::get(FlagTy, 1), FlagName);
182         GV->setSection(FlagSymbolSection);
183         GV->setAlignment(Align(1));
184         GV->setUnnamedAddr(GlobalValue::UnnamedAddr::Global);
185         attachDebugInfo(*GV, *SP);
186         return GV;
187       });
188     }
189 
190     if (!CheckFunction) {
191       Function *DefaultCheckFunc =
192           createDefaultCheckFunction(M, UseX86FastCall);
193       if (IsELF) {
194         DefaultCheckFunc->setName(CheckFunctionName);
195         DefaultCheckFunc->setLinkage(GlobalValue::WeakAnyLinkage);
196         CheckFunction = DefaultCheckFunc;
197       } else {
198         assert(!M.getFunction(CheckFunctionName) &&
199                "JMC instrument more than once?");
200         auto *CheckFunc = cast<Function>(
201             M.getOrInsertFunction(CheckFunctionName, getCheckFunctionType(Ctx))
202                 .getCallee());
203         CheckFunc->setUnnamedAddr(GlobalValue::UnnamedAddr::Global);
204         CheckFunc->addParamAttr(0, Attribute::NoUndef);
205         if (UseX86FastCall) {
206           CheckFunc->setCallingConv(CallingConv::X86_FastCall);
207           CheckFunc->addParamAttr(0, Attribute::InReg);
208         }
209         CheckFunction = CheckFunc;
210 
211         StringRef DefaultCheckFunctionName = DefaultCheckFunc->getName();
212         appendToUsed(M, {DefaultCheckFunc});
213         Comdat *C = M.getOrInsertComdat(DefaultCheckFunctionName);
214         C->setSelectionKind(Comdat::Any);
215         DefaultCheckFunc->setComdat(C);
216         // Add a linker option /alternatename to set the default implementation
217         // for the check function.
218         // https://devblogs.microsoft.com/oldnewthing/20200731-00/?p=104024
219         std::string AltOption = std::string("/alternatename:") +
220                                 CheckFunctionName + "=" +
221                                 DefaultCheckFunctionName.str();
222         llvm::Metadata *Ops[] = {llvm::MDString::get(Ctx, AltOption)};
223         MDTuple *N = MDNode::get(Ctx, Ops);
224         M.getOrInsertNamedMetadata("llvm.linker.options")->addOperand(N);
225       }
226     }
227     // FIXME: it would be nice to make CI scheduling boundary, although in
228     //        practice it does not matter much.
229     auto *CI = CallInst::Create(getCheckFunctionType(Ctx), CheckFunction,
230                                 {Flag}, "", F.begin()->getFirstInsertionPt());
231     CI->addParamAttr(0, Attribute::NoUndef);
232     if (UseX86FastCall) {
233       CI->setCallingConv(CallingConv::X86_FastCall);
234       CI->addParamAttr(0, Attribute::InReg);
235     }
236 
237     Changed = true;
238   }
239   return Changed;
240 }
241