1 /****************************************************************************
2  * Copyright (C) 2014-2018 Intel Corporation.   All Rights Reserved.
3  *
4  * Permission is hereby granted, free of charge, to any person obtaining a
5  * copy of this software and associated documentation files (the "Software"),
6  * to deal in the Software without restriction, including without limitation
7  * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8  * and/or sell copies of the Software, and to permit persons to whom the
9  * Software is furnished to do so, subject to the following conditions:
10  *
11  * The above copyright notice and this permission notice (including the next
12  * paragraph) shall be included in all copies or substantial portions of the
13  * Software.
14  *
15  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
18  * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19  * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
20  * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
21  * IN THE SOFTWARE.
22  *
23  * @file JitManager.cpp
24  *
25  * @brief Implementation if the Jit Manager.
26  *
27  * Notes:
28  *
29  ******************************************************************************/
30 #include "jit_pch.hpp"
31 
32 #include "JitManager.h"
33 #include "jit_api.h"
34 #include "fetch_jit.h"
35 
36 #include "core/state.h"
37 
38 #include "gen_state_llvm.h"
39 
40 #include <sstream>
41 #if defined(_WIN32)
42 #include <psapi.h>
43 #include <cstring>
44 
45 #define INTEL_OUTPUT_DIR "c:\\Intel"
46 #define SWR_OUTPUT_DIR INTEL_OUTPUT_DIR "\\SWR"
47 #define JITTER_OUTPUT_DIR SWR_OUTPUT_DIR "\\Jitter"
48 #endif // _WIN32
49 
50 #if defined(__APPLE__) || defined(FORCE_LINUX) || defined(__linux__) || defined(__gnu_linux__)
51 #include <pwd.h>
52 #include <sys/stat.h>
53 #endif
54 
55 
56 using namespace llvm;
57 using namespace SwrJit;
58 
59 //////////////////////////////////////////////////////////////////////////
60 /// @brief Contructor for JitManager.
61 /// @param simdWidth - SIMD width to be used in generated program.
JitManager(uint32_t simdWidth,const char * arch,const char * core)62 JitManager::JitManager(uint32_t simdWidth, const char* arch, const char* core) :
63     mContext(), mBuilder(mContext), mIsModuleFinalized(true), mJitNumber(0), mVWidth(simdWidth),
64     mArch(arch)
65 {
66     mpCurrentModule = nullptr;
67     mpExec          = nullptr;
68 
69     InitializeNativeTarget();
70     InitializeNativeTargetAsmPrinter();
71     InitializeNativeTargetDisassembler();
72 
73 
74     // force JIT to use the same CPU arch as the rest of swr
75     if (mArch.AVX512F())
76     {
77 #if USE_SIMD16_SHADERS
78         if (mArch.AVX512ER())
79         {
80             mHostCpuName = StringRef("knl");
81         }
82         else
83         {
84             mHostCpuName = StringRef("skylake-avx512");
85         }
86         mUsingAVX512 = true;
87 #else
88         mHostCpuName = StringRef("core-avx2");
89 #endif
90         if (mVWidth == 0)
91         {
92             mVWidth = 8;
93         }
94     }
95     else if (mArch.AVX2())
96     {
97         mHostCpuName = StringRef("core-avx2");
98         if (mVWidth == 0)
99         {
100             mVWidth = 8;
101         }
102     }
103     else if (mArch.AVX())
104     {
105         if (mArch.F16C())
106         {
107             mHostCpuName = StringRef("core-avx-i");
108         }
109         else
110         {
111             mHostCpuName = StringRef("corei7-avx");
112         }
113         if (mVWidth == 0)
114         {
115             mVWidth = 8;
116         }
117     }
118     else
119     {
120         SWR_INVALID("Jitting requires at least AVX ISA support");
121     }
122 
123 
124     mOptLevel = CodeGenOpt::Aggressive;
125 
126     if (KNOB_JIT_OPTIMIZATION_LEVEL >= CodeGenOpt::None &&
127         KNOB_JIT_OPTIMIZATION_LEVEL <= CodeGenOpt::Aggressive)
128     {
129         mOptLevel = CodeGenOpt::Level(KNOB_JIT_OPTIMIZATION_LEVEL);
130     }
131 
132     if (KNOB_JIT_ENABLE_CACHE)
133     {
134         mCache.Init(this, mHostCpuName, mOptLevel);
135     }
136 
137     SetupNewModule();
138     mIsModuleFinalized = true;
139 
140     // fetch function signature
141 #if USE_SIMD16_SHADERS
142     // typedef void(__cdecl *PFN_FETCH_FUNC)(SWR_FETCH_CONTEXT& fetchInfo, simd16vertex& out);
143 #else
144     // typedef void(__cdecl *PFN_FETCH_FUNC)(SWR_FETCH_CONTEXT& fetchInfo, simdvertex& out);
145 #endif
146     std::vector<Type*> fsArgs;
147 
148     // llvm5 is picky and does not take a void * type
149     fsArgs.push_back(PointerType::get(Gen_SWR_FETCH_CONTEXT(this), 0));
150 
151     fsArgs.push_back(Type::getInt8PtrTy(mContext));
152 
153     fsArgs.push_back(PointerType::get(Gen_SWR_FETCH_CONTEXT(this), 0));
154 #if USE_SIMD16_SHADERS
155     fsArgs.push_back(PointerType::get(Gen_simd16vertex(this), 0));
156 #else
157     fsArgs.push_back(PointerType::get(Gen_simdvertex(this), 0));
158 #endif
159 
160     mFetchShaderTy = FunctionType::get(Type::getVoidTy(mContext), fsArgs, false);
161 
162 #if defined(_MSC_VER)
163     // explicitly instantiate used symbols from potentially staticly linked libs
164     sys::DynamicLibrary::AddSymbol("exp2f", &exp2f);
165     sys::DynamicLibrary::AddSymbol("log2f", &log2f);
166     sys::DynamicLibrary::AddSymbol("sinf", &sinf);
167     sys::DynamicLibrary::AddSymbol("cosf", &cosf);
168     sys::DynamicLibrary::AddSymbol("powf", &powf);
169 #endif
170 
171 #if defined(_WIN32)
172     if (KNOB_DUMP_SHADER_IR)
173     {
174         CreateDirectoryPath(INTEL_OUTPUT_DIR);
175         CreateDirectoryPath(SWR_OUTPUT_DIR);
176         CreateDirectoryPath(JITTER_OUTPUT_DIR);
177     }
178 #endif
179 }
180 
CreateExecEngine(std::unique_ptr<Module> pModule)181 void JitManager::CreateExecEngine(std::unique_ptr<Module> pModule)
182 {
183     TargetOptions tOpts;
184     tOpts.AllowFPOpFusion = FPOpFusion::Fast;
185     tOpts.NoInfsFPMath    = false;
186     tOpts.NoNaNsFPMath    = false;
187     tOpts.UnsafeFPMath = false;
188 
189     // tOpts.PrintMachineCode    = true;
190 
191     mpExec = EngineBuilder(std::move(pModule))
192                  .setTargetOptions(tOpts)
193                  .setOptLevel(mOptLevel)
194                  .setMCPU(mHostCpuName)
195                  .create();
196 
197     if (KNOB_JIT_ENABLE_CACHE)
198     {
199         mpExec->setObjectCache(&mCache);
200     }
201 
202 #if LLVM_USE_INTEL_JITEVENTS
203     JITEventListener* vTune = JITEventListener::createIntelJITEventListener();
204     mpExec->RegisterJITEventListener(vTune);
205 #endif
206 
207     mvExecEngines.push_back(mpExec);
208 }
209 
210 //////////////////////////////////////////////////////////////////////////
211 /// @brief Create new LLVM module.
SetupNewModule()212 void JitManager::SetupNewModule()
213 {
214     SWR_ASSERT(mIsModuleFinalized == true && "Current module is not finalized!");
215 
216     std::unique_ptr<Module> newModule(new Module("", mContext));
217     mpCurrentModule = newModule.get();
218     mpCurrentModule->setTargetTriple(sys::getProcessTriple());
219     CreateExecEngine(std::move(newModule));
220     mIsModuleFinalized = false;
221 }
222 
223 
224 DIType*
CreateDebugStructType(StructType * pType,const std::string & name,DIFile * pFile,uint32_t lineNum,const std::vector<std::pair<std::string,uint32_t>> & members)225 JitManager::CreateDebugStructType(StructType*                                          pType,
226                                   const std::string&                                   name,
227                                   DIFile*                                              pFile,
228                                   uint32_t                                             lineNum,
229                                   const std::vector<std::pair<std::string, uint32_t>>& members)
230 {
231     DIBuilder                 builder(*mpCurrentModule);
232     SmallVector<Metadata*, 8> ElemTypes;
233     DataLayout                DL        = DataLayout(mpCurrentModule);
234     uint32_t                  size      = DL.getTypeAllocSizeInBits(pType);
235     uint32_t                  alignment = DL.getABITypeAlignment(pType);
236     DINode::DIFlags           flags     = DINode::DIFlags::FlagPublic;
237 
238     DICompositeType* pDIStructTy = builder.createStructType(pFile,
239                                                             name,
240                                                             pFile,
241                                                             lineNum,
242                                                             size,
243                                                             alignment,
244                                                             flags,
245                                                             nullptr,
246                                                             builder.getOrCreateArray(ElemTypes));
247 
248     // Register mapping now to break loops (in case struct contains itself or pointers to itself)
249     mDebugStructMap[pType] = pDIStructTy;
250 
251     uint32_t idx = 0;
252     for (auto& elem : pType->elements())
253     {
254         std::string name       = members[idx].first;
255         uint32_t    lineNum    = members[idx].second;
256         size                   = DL.getTypeAllocSizeInBits(elem);
257         alignment              = DL.getABITypeAlignment(elem);
258         uint32_t      offset   = DL.getStructLayout(pType)->getElementOffsetInBits(idx);
259         llvm::DIType* pDebugTy = GetDebugType(elem);
260         ElemTypes.push_back(builder.createMemberType(
261             pDIStructTy, name, pFile, lineNum, size, alignment, offset, flags, pDebugTy));
262 
263         idx++;
264     }
265 
266     pDIStructTy->replaceElements(builder.getOrCreateArray(ElemTypes));
267     return pDIStructTy;
268 }
269 
GetDebugArrayType(Type * pTy)270 DIType* JitManager::GetDebugArrayType(Type* pTy)
271 {
272     DIBuilder  builder(*mpCurrentModule);
273     DataLayout DL        = DataLayout(mpCurrentModule);
274     ArrayType* pArrayTy  = cast<ArrayType>(pTy);
275     uint32_t   size      = DL.getTypeAllocSizeInBits(pArrayTy);
276     uint32_t   alignment = DL.getABITypeAlignment(pArrayTy);
277 
278     SmallVector<Metadata*, 8> Elems;
279     Elems.push_back(builder.getOrCreateSubrange(0, pArrayTy->getNumElements()));
280     return builder.createArrayType(
281         size, alignment, GetDebugType(pArrayTy->getElementType()), builder.getOrCreateArray(Elems));
282 }
283 
284 // Create a DIType from llvm Type
GetDebugType(Type * pTy)285 DIType* JitManager::GetDebugType(Type* pTy)
286 {
287     DIBuilder    builder(*mpCurrentModule);
288     Type::TypeID id = pTy->getTypeID();
289 
290     switch (id)
291     {
292     case Type::VoidTyID:
293         return builder.createUnspecifiedType("void");
294         break;
295     case Type::HalfTyID:
296         return builder.createBasicType("float16", 16, dwarf::DW_ATE_float);
297         break;
298     case Type::FloatTyID:
299         return builder.createBasicType("float", 32, dwarf::DW_ATE_float);
300         break;
301     case Type::DoubleTyID:
302         return builder.createBasicType("double", 64, dwarf::DW_ATE_float);
303         break;
304     case Type::IntegerTyID:
305         return GetDebugIntegerType(pTy);
306         break;
307     case Type::StructTyID:
308         return GetDebugStructType(pTy);
309         break;
310     case Type::ArrayTyID:
311         return GetDebugArrayType(pTy);
312         break;
313     case Type::PointerTyID:
314         return builder.createPointerType(GetDebugType(pTy->getPointerElementType()), 64, 64);
315         break;
316 #if LLVM_VERSION_MAJOR >= 11
317     case Type::FixedVectorTyID:
318 #else
319     case Type::VectorTyID:
320 #endif
321         return GetDebugVectorType(pTy);
322         break;
323     case Type::FunctionTyID:
324         return GetDebugFunctionType(pTy);
325         break;
326     default:
327         SWR_ASSERT(false, "Unimplemented llvm type");
328     }
329     return nullptr;
330 }
331 
332 // Create a DISubroutineType from an llvm FunctionType
GetDebugFunctionType(Type * pTy)333 DIType* JitManager::GetDebugFunctionType(Type* pTy)
334 {
335     SmallVector<Metadata*, 8> ElemTypes;
336     FunctionType*             pFuncTy = cast<FunctionType>(pTy);
337     DIBuilder                 builder(*mpCurrentModule);
338 
339     // Add result type
340     ElemTypes.push_back(GetDebugType(pFuncTy->getReturnType()));
341 
342     // Add arguments
343     for (auto& param : pFuncTy->params())
344     {
345         ElemTypes.push_back(GetDebugType(param));
346     }
347 
348     return builder.createSubroutineType(builder.getOrCreateTypeArray(ElemTypes));
349 }
350 
GetDebugIntegerType(Type * pTy)351 DIType* JitManager::GetDebugIntegerType(Type* pTy)
352 {
353     DIBuilder    builder(*mpCurrentModule);
354     IntegerType* pIntTy = cast<IntegerType>(pTy);
355     switch (pIntTy->getBitWidth())
356     {
357     case 1:
358         return builder.createBasicType("int1", 1, dwarf::DW_ATE_unsigned);
359         break;
360     case 8:
361         return builder.createBasicType("int8", 8, dwarf::DW_ATE_signed);
362         break;
363     case 16:
364         return builder.createBasicType("int16", 16, dwarf::DW_ATE_signed);
365         break;
366     case 32:
367         return builder.createBasicType("int", 32, dwarf::DW_ATE_signed);
368         break;
369     case 64:
370         return builder.createBasicType("int64", 64, dwarf::DW_ATE_signed);
371         break;
372     case 128:
373         return builder.createBasicType("int128", 128, dwarf::DW_ATE_signed);
374         break;
375     default:
376         SWR_ASSERT(false, "Unimplemented integer bit width");
377     }
378     return nullptr;
379 }
380 
GetDebugVectorType(Type * pTy)381 DIType* JitManager::GetDebugVectorType(Type* pTy)
382 {
383     DIBuilder                 builder(*mpCurrentModule);
384     VectorType*               pVecTy    = cast<VectorType>(pTy);
385     DataLayout                DL        = DataLayout(mpCurrentModule);
386     uint32_t                  size      = DL.getTypeAllocSizeInBits(pVecTy);
387     uint32_t                  alignment = DL.getABITypeAlignment(pVecTy);
388     SmallVector<Metadata*, 1> Elems;
389 
390 #if LLVM_VERSION_MAJOR >= 11
391     Elems.push_back(builder.getOrCreateSubrange(0, pVecTy->getNumElements()));
392 #else
393     Elems.push_back(builder.getOrCreateSubrange(0, pVecTy->getVectorNumElements()));
394 #endif
395 
396     return builder.createVectorType(size,
397                                     alignment,
398 #if LLVM_VERSION_MAJOR >= 11
399                                     GetDebugType(pVecTy->getElementType()),
400 #else
401                                     GetDebugType(pVecTy->getVectorElementType()),
402 #endif
403                                     builder.getOrCreateArray(Elems));
404 }
405 
406 //////////////////////////////////////////////////////////////////////////
407 /// @brief Dump function x86 assembly to file.
408 /// @note This should only be called after the module has been jitted to x86 and the
409 ///       module will not be further accessed.
DumpAsm(Function * pFunction,const char * fileName)410 void JitManager::DumpAsm(Function* pFunction, const char* fileName)
411 {
412     if (KNOB_DUMP_SHADER_IR)
413     {
414 #if defined(_WIN32)
415         DWORD pid = GetCurrentProcessId();
416         char  procname[MAX_PATH];
417         GetModuleFileNameA(NULL, procname, MAX_PATH);
418         const char*       pBaseName = strrchr(procname, '\\');
419         std::stringstream outDir;
420         outDir << JITTER_OUTPUT_DIR << pBaseName << "_" << pid << std::ends;
421         CreateDirectoryPath(outDir.str().c_str());
422 #endif
423 
424         std::error_code EC;
425         Module*         pModule  = pFunction->getParent();
426         const char*     funcName = pFunction->getName().data();
427         char            fName[256];
428 #if defined(_WIN32)
429         sprintf(fName, "%s\\%s.%s.asm", outDir.str().c_str(), funcName, fileName);
430 #else
431         sprintf(fName, "%s.%s.asm", funcName, fileName);
432 #endif
433 
434         raw_fd_ostream filestream(fName, EC, llvm::sys::fs::F_None);
435 
436         legacy::PassManager* pMPasses         = new legacy::PassManager();
437         auto*                pTarget          = mpExec->getTargetMachine();
438         pTarget->Options.MCOptions.AsmVerbose = true;
439 #if LLVM_VERSION_MAJOR >= 10
440         pTarget->addPassesToEmitFile(
441             *pMPasses, filestream, nullptr, CGFT_AssemblyFile);
442 #elif LLVM_VERSION_MAJOR >= 7
443         pTarget->addPassesToEmitFile(
444             *pMPasses, filestream, nullptr, TargetMachine::CGFT_AssemblyFile);
445 #else
446         pTarget->addPassesToEmitFile(*pMPasses, filestream, TargetMachine::CGFT_AssemblyFile);
447 #endif
448         pMPasses->run(*pModule);
449         delete pMPasses;
450         pTarget->Options.MCOptions.AsmVerbose = false;
451     }
452 }
453 
GetOutputDir()454 std::string JitManager::GetOutputDir()
455 {
456 #if defined(_WIN32)
457     DWORD pid = GetCurrentProcessId();
458     char  procname[MAX_PATH];
459     GetModuleFileNameA(NULL, procname, MAX_PATH);
460     const char*       pBaseName = strrchr(procname, '\\');
461     std::stringstream outDir;
462     outDir << JITTER_OUTPUT_DIR << pBaseName << "_" << pid;
463     CreateDirectoryPath(outDir.str().c_str());
464     return outDir.str();
465 #endif
466     return "";
467 }
468 
469 //////////////////////////////////////////////////////////////////////////
470 /// @brief Dump function to file.
DumpToFile(Module * M,const char * fileName,llvm::AssemblyAnnotationWriter * annotater)471 void JitManager::DumpToFile(Module*                         M,
472                             const char*                     fileName,
473                             llvm::AssemblyAnnotationWriter* annotater)
474 {
475     if (KNOB_DUMP_SHADER_IR)
476     {
477         std::string outDir = GetOutputDir();
478 
479         std::error_code EC;
480         const char*     funcName = M->getName().data();
481         char            fName[256];
482 #if defined(_WIN32)
483         sprintf(fName, "%s\\%s.%s.ll", outDir.c_str(), funcName, fileName);
484 #else
485         sprintf(fName, "%s.%s.ll", funcName, fileName);
486 #endif
487         raw_fd_ostream fd(fName, EC, llvm::sys::fs::F_None);
488         M->print(fd, annotater);
489         fd.flush();
490     }
491 }
492 
493 //////////////////////////////////////////////////////////////////////////
494 /// @brief Dump function to file.
DumpToFile(Function * f,const char * fileName)495 void JitManager::DumpToFile(Function* f, const char* fileName)
496 {
497     if (KNOB_DUMP_SHADER_IR)
498     {
499         std::string outDir = GetOutputDir();
500 
501         std::error_code EC;
502         const char*     funcName = f->getName().data();
503         char            fName[256];
504 #if defined(_WIN32)
505         sprintf(fName, "%s\\%s.%s.ll", outDir.c_str(), funcName, fileName);
506 #else
507         sprintf(fName, "%s.%s.ll", funcName, fileName);
508 #endif
509         raw_fd_ostream fd(fName, EC, llvm::sys::fs::F_None);
510         f->print(fd, nullptr);
511 
512 #if defined(_WIN32)
513         sprintf(fName, "%s\\cfg.%s.%s.dot", outDir.c_str(), funcName, fileName);
514 #else
515         sprintf(fName, "cfg.%s.%s.dot", funcName, fileName);
516 #endif
517         fd.flush();
518 
519         raw_fd_ostream fd_cfg(fName, EC, llvm::sys::fs::F_Text);
520         WriteGraph(fd_cfg, (const Function*)f);
521 
522         fd_cfg.flush();
523     }
524 }
525 
526 extern "C" {
527 bool g_DllActive = true;
528 
529 //////////////////////////////////////////////////////////////////////////
530 /// @brief Create JIT context.
531 /// @param simdWidth - SIMD width to be used in generated program.
JitCreateContext(uint32_t targetSimdWidth,const char * arch,const char * core)532 HANDLE JITCALL JitCreateContext(uint32_t targetSimdWidth, const char* arch, const char* core)
533 {
534     return new JitManager(targetSimdWidth, arch, core);
535 }
536 
537 //////////////////////////////////////////////////////////////////////////
538 /// @brief Destroy JIT context.
JitDestroyContext(HANDLE hJitContext)539 void JITCALL JitDestroyContext(HANDLE hJitContext)
540 {
541     if (g_DllActive)
542     {
543         delete reinterpret_cast<JitManager*>(hJitContext);
544     }
545 }
546 }
547 
548 //////////////////////////////////////////////////////////////////////////
549 /// JitCache
550 //////////////////////////////////////////////////////////////////////////
551 
552 //////////////////////////////////////////////////////////////////////////
553 /// JitCacheFileHeader
554 //////////////////////////////////////////////////////////////////////////
555 struct JitCacheFileHeader
556 {
InitJitCacheFileHeader557     void Init(uint32_t           llCRC,
558               uint32_t           objCRC,
559               const std::string& moduleID,
560               const std::string& cpu,
561               uint32_t           optLevel,
562               uint64_t           objSize)
563     {
564         m_objSize = objSize;
565         m_llCRC   = llCRC;
566         m_objCRC  = objCRC;
567         strncpy(m_ModuleID, moduleID.c_str(), JC_STR_MAX_LEN - 1);
568         m_ModuleID[JC_STR_MAX_LEN - 1] = 0;
569         strncpy(m_Cpu, cpu.c_str(), JC_STR_MAX_LEN - 1);
570         m_Cpu[JC_STR_MAX_LEN - 1] = 0;
571         m_optLevel                = optLevel;
572     }
573 
574 
575     bool
IsValidJitCacheFileHeader576     IsValid(uint32_t llCRC, const std::string& moduleID, const std::string& cpu, uint32_t optLevel)
577     {
578         if ((m_MagicNumber != JC_MAGIC_NUMBER) || (m_llCRC != llCRC) ||
579             (m_platformKey != JC_PLATFORM_KEY) || (m_optLevel != optLevel))
580         {
581             return false;
582         }
583 
584         m_ModuleID[JC_STR_MAX_LEN - 1] = 0;
585         if (strncmp(moduleID.c_str(), m_ModuleID, JC_STR_MAX_LEN - 1))
586         {
587             return false;
588         }
589 
590         m_Cpu[JC_STR_MAX_LEN - 1] = 0;
591         if (strncmp(cpu.c_str(), m_Cpu, JC_STR_MAX_LEN - 1))
592         {
593             return false;
594         }
595 
596         return true;
597     }
598 
GetObjectSizeJitCacheFileHeader599     uint64_t GetObjectSize() const { return m_objSize; }
GetObjectCRCJitCacheFileHeader600     uint64_t GetObjectCRC() const { return m_objCRC; }
601 
602 private:
603     static const uint64_t JC_MAGIC_NUMBER = 0xfedcba9876543210ULL + 7;
604     static const size_t   JC_STR_MAX_LEN  = 32;
605     static const uint32_t JC_PLATFORM_KEY = (LLVM_VERSION_MAJOR << 24) |
606                                             (LLVM_VERSION_MINOR << 16) | (LLVM_VERSION_PATCH << 8) |
607                                             ((sizeof(void*) > sizeof(uint32_t)) ? 1 : 0);
608 
609     uint64_t m_MagicNumber              = JC_MAGIC_NUMBER;
610     uint64_t m_objSize                  = 0;
611     uint32_t m_llCRC                    = 0;
612     uint32_t m_platformKey              = JC_PLATFORM_KEY;
613     uint32_t m_objCRC                   = 0;
614     uint32_t m_optLevel                 = 0;
615     char     m_ModuleID[JC_STR_MAX_LEN] = {};
616     char     m_Cpu[JC_STR_MAX_LEN]      = {};
617 };
618 
ComputeModuleCRC(const llvm::Module * M)619 static inline uint32_t ComputeModuleCRC(const llvm::Module* M)
620 {
621     std::string        bitcodeBuffer;
622     raw_string_ostream bitcodeStream(bitcodeBuffer);
623 
624 #if LLVM_VERSION_MAJOR >= 7
625     llvm::WriteBitcodeToFile(*M, bitcodeStream);
626 #else
627     llvm::WriteBitcodeToFile(M, bitcodeStream);
628 #endif
629     // M->print(bitcodeStream, nullptr, false);
630 
631     bitcodeStream.flush();
632 
633     return ComputeCRC(0, bitcodeBuffer.data(), bitcodeBuffer.size());
634 }
635 
636 /// constructor
JitCache()637 JitCache::JitCache()
638 {
639 #if defined(__APPLE__) || defined(FORCE_LINUX) || defined(__linux__) || defined(__gnu_linux__)
640     if (strncmp(KNOB_JIT_CACHE_DIR.c_str(), "~/", 2) == 0)
641     {
642         char* homedir;
643         if (!(homedir = getenv("HOME")))
644         {
645             homedir = getpwuid(getuid())->pw_dir;
646         }
647         mCacheDir = homedir;
648         mCacheDir += (KNOB_JIT_CACHE_DIR.c_str() + 1);
649     }
650     else
651 #endif
652     {
653         mCacheDir = KNOB_JIT_CACHE_DIR;
654     }
655 
656     // Create cache dir at startup to allow jitter to write debug.ll files
657     // to that directory.
658     if (!llvm::sys::fs::exists(mCacheDir.str()) &&
659         llvm::sys::fs::create_directories(mCacheDir.str()))
660     {
661         SWR_INVALID("Unable to create directory: %s", mCacheDir.c_str());
662     }
663 
664 }
665 
ExecUnhookedProcess(const std::string & CmdLine,std::string * pStdOut,std::string * pStdErr)666 int ExecUnhookedProcess(const std::string& CmdLine, std::string* pStdOut, std::string* pStdErr)
667 {
668 
669     return ExecCmd(CmdLine, nullptr, pStdOut, pStdErr);
670 }
671 
672 /// Calculate actual directory where module will be cached.
673 /// This is always a subdirectory of mCacheDir.  Full absolute
674 /// path name will be stored in mCurrentModuleCacheDir
CalcModuleCacheDir()675 void JitCache::CalcModuleCacheDir()
676 {
677     mModuleCacheDir.clear();
678 
679     llvm::SmallString<MAX_PATH> moduleDir = mCacheDir;
680 
681     // Create 4 levels of directory hierarchy based on CRC, 256 entries each
682     uint8_t* pCRC = (uint8_t*)&mCurrentModuleCRC;
683     for (uint32_t i = 0; i < 4; ++i)
684     {
685         llvm::sys::path::append(moduleDir, std::to_string((int)pCRC[i]));
686     }
687 
688     mModuleCacheDir = moduleDir;
689 }
690 
691 /// notifyObjectCompiled - Provides a pointer to compiled code for Module M.
notifyObjectCompiled(const llvm::Module * M,llvm::MemoryBufferRef Obj)692 void JitCache::notifyObjectCompiled(const llvm::Module* M, llvm::MemoryBufferRef Obj)
693 {
694     const std::string& moduleID = M->getModuleIdentifier();
695     if (!moduleID.length())
696     {
697         return;
698     }
699 
700     if (!mModuleCacheDir.size())
701     {
702         SWR_INVALID("Unset module cache directory");
703         return;
704     }
705 
706     if (!llvm::sys::fs::exists(mModuleCacheDir.str()) &&
707         llvm::sys::fs::create_directories(mModuleCacheDir.str()))
708     {
709         SWR_INVALID("Unable to create directory: %s", mModuleCacheDir.c_str());
710         return;
711     }
712 
713     JitCacheFileHeader header;
714 
715     llvm::SmallString<MAX_PATH> filePath = mModuleCacheDir;
716     llvm::sys::path::append(filePath, moduleID);
717 
718     llvm::SmallString<MAX_PATH> objPath = filePath;
719     objPath += JIT_OBJ_EXT;
720 
721     {
722         std::error_code      err;
723         llvm::raw_fd_ostream fileObj(objPath.c_str(), err, llvm::sys::fs::F_None);
724         fileObj << Obj.getBuffer();
725         fileObj.flush();
726     }
727 
728 
729     {
730         std::error_code      err;
731         llvm::raw_fd_ostream fileObj(filePath.c_str(), err, llvm::sys::fs::F_None);
732 
733         uint32_t objcrc = ComputeCRC(0, Obj.getBufferStart(), Obj.getBufferSize());
734 
735         header.Init(mCurrentModuleCRC, objcrc, moduleID, mCpu, mOptLevel, Obj.getBufferSize());
736 
737         fileObj.write((const char*)&header, sizeof(header));
738         fileObj.flush();
739     }
740 }
741 
742 /// Returns a pointer to a newly allocated MemoryBuffer that contains the
743 /// object which corresponds with Module M, or 0 if an object is not
744 /// available.
getObject(const llvm::Module * M)745 std::unique_ptr<llvm::MemoryBuffer> JitCache::getObject(const llvm::Module* M)
746 {
747     const std::string& moduleID = M->getModuleIdentifier();
748     mCurrentModuleCRC           = ComputeModuleCRC(M);
749 
750     if (!moduleID.length())
751     {
752         return nullptr;
753     }
754 
755     CalcModuleCacheDir();
756 
757     if (!llvm::sys::fs::exists(mModuleCacheDir))
758     {
759         return nullptr;
760     }
761 
762     llvm::SmallString<MAX_PATH> filePath = mModuleCacheDir;
763     llvm::sys::path::append(filePath, moduleID);
764 
765     llvm::SmallString<MAX_PATH> objFilePath = filePath;
766     objFilePath += JIT_OBJ_EXT;
767 
768     FILE* fpObjIn = nullptr;
769     FILE* fpIn    = fopen(filePath.c_str(), "rb");
770     if (!fpIn)
771     {
772         return nullptr;
773     }
774 
775     std::unique_ptr<llvm::MemoryBuffer> pBuf = nullptr;
776     do
777     {
778         JitCacheFileHeader header;
779         if (!fread(&header, sizeof(header), 1, fpIn))
780         {
781             break;
782         }
783 
784         if (!header.IsValid(mCurrentModuleCRC, moduleID, mCpu, mOptLevel))
785         {
786             break;
787         }
788 
789         fpObjIn = fopen(objFilePath.c_str(), "rb");
790         if (!fpObjIn)
791         {
792             break;
793         }
794 
795 #if LLVM_VERSION_MAJOR < 6
796         pBuf = llvm::MemoryBuffer::getNewUninitMemBuffer(size_t(header.GetObjectSize()));
797 #else
798         pBuf = llvm::WritableMemoryBuffer::getNewUninitMemBuffer(size_t(header.GetObjectSize()));
799 #endif
800         if (!fread(const_cast<char*>(pBuf->getBufferStart()), header.GetObjectSize(), 1, fpObjIn))
801         {
802             pBuf = nullptr;
803             break;
804         }
805 
806         if (header.GetObjectCRC() != ComputeCRC(0, pBuf->getBufferStart(), pBuf->getBufferSize()))
807         {
808             SWR_TRACE("Invalid object cache file, ignoring: %s", filePath.c_str());
809             pBuf = nullptr;
810             break;
811         }
812 
813     } while (0);
814 
815     fclose(fpIn);
816 
817     if (fpObjIn)
818     {
819         fclose(fpObjIn);
820     }
821 
822 
823     return pBuf;
824 }
825 
emitInstructionAnnot(const llvm::Instruction * pInst,llvm::formatted_raw_ostream & OS)826 void InterleaveAssemblyAnnotater::emitInstructionAnnot(const llvm::Instruction*     pInst,
827                                                        llvm::formatted_raw_ostream& OS)
828 {
829     auto dbgLoc = pInst->getDebugLoc();
830     if (dbgLoc)
831     {
832         unsigned int line = dbgLoc.getLine();
833         if (line != mCurrentLineNo)
834         {
835             if (line > 0 && line <= mAssembly.size())
836             {
837                 // HACK: here we assume that OS is a formatted_raw_ostream(ods())
838                 // and modify the color accordingly. We can't do the color
839                 // modification on OS because formatted_raw_ostream strips
840                 // the color information. The only way to fix this behavior
841                 // is to patch LLVM.
842                 OS << "\n; " << line << ": " << mAssembly[line - 1] << "\n";
843             }
844             mCurrentLineNo = line;
845         }
846     }
847 }
848