1 /****************************************************************************
2 * Copyright (C) 2014-2018 Intel Corporation. All Rights Reserved.
3 *
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
10 *
11 * The above copyright notice and this permission notice (including the next
12 * paragraph) shall be included in all copies or substantial portions of the
13 * Software.
14 *
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
18 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
20 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
21 * IN THE SOFTWARE.
22 *
23 * @file JitManager.cpp
24 *
25 * @brief Implementation of the Jit Manager.
26 *
27 * Notes:
28 *
29 ******************************************************************************/
30 #include "jit_pch.hpp"
31
32 #include "JitManager.h"
33 #include "jit_api.h"
34 #include "fetch_jit.h"
35
36 #include "core/state.h"
37
38 #include "gen_state_llvm.h"
39
40 #include <sstream>
41 #if defined(_WIN32)
42 #include <psapi.h>
43 #include <cstring>
44
45 #define INTEL_OUTPUT_DIR "c:\\Intel"
46 #define SWR_OUTPUT_DIR INTEL_OUTPUT_DIR "\\SWR"
47 #define JITTER_OUTPUT_DIR SWR_OUTPUT_DIR "\\Jitter"
48 #endif // _WIN32
49
50 #if defined(__APPLE__) || defined(FORCE_LINUX) || defined(__linux__) || defined(__gnu_linux__)
51 #include <pwd.h>
52 #include <sys/stat.h>
53 #endif
54
55
56 using namespace llvm;
57 using namespace SwrJit;
58
59 //////////////////////////////////////////////////////////////////////////
60 /// @brief Contructor for JitManager.
61 /// @param simdWidth - SIMD width to be used in generated program.
JitManager(uint32_t simdWidth,const char * arch,const char * core)62 JitManager::JitManager(uint32_t simdWidth, const char* arch, const char* core) :
63 mContext(), mBuilder(mContext), mIsModuleFinalized(true), mJitNumber(0), mVWidth(simdWidth),
64 mArch(arch)
65 {
66 mpCurrentModule = nullptr;
67 mpExec = nullptr;
68
69 InitializeNativeTarget();
70 InitializeNativeTargetAsmPrinter();
71 InitializeNativeTargetDisassembler();
72
73
74 // force JIT to use the same CPU arch as the rest of swr
75 if (mArch.AVX512F())
76 {
77 #if USE_SIMD16_SHADERS
78 if (mArch.AVX512ER())
79 {
80 mHostCpuName = StringRef("knl");
81 }
82 else
83 {
84 mHostCpuName = StringRef("skylake-avx512");
85 }
86 mUsingAVX512 = true;
87 #else
88 mHostCpuName = StringRef("core-avx2");
89 #endif
90 if (mVWidth == 0)
91 {
92 mVWidth = 8;
93 }
94 }
95 else if (mArch.AVX2())
96 {
97 mHostCpuName = StringRef("core-avx2");
98 if (mVWidth == 0)
99 {
100 mVWidth = 8;
101 }
102 }
103 else if (mArch.AVX())
104 {
105 if (mArch.F16C())
106 {
107 mHostCpuName = StringRef("core-avx-i");
108 }
109 else
110 {
111 mHostCpuName = StringRef("corei7-avx");
112 }
113 if (mVWidth == 0)
114 {
115 mVWidth = 8;
116 }
117 }
118 else
119 {
120 SWR_INVALID("Jitting requires at least AVX ISA support");
121 }
122
123
124 mOptLevel = CodeGenOpt::Aggressive;
125
126 if (KNOB_JIT_OPTIMIZATION_LEVEL >= CodeGenOpt::None &&
127 KNOB_JIT_OPTIMIZATION_LEVEL <= CodeGenOpt::Aggressive)
128 {
129 mOptLevel = CodeGenOpt::Level(KNOB_JIT_OPTIMIZATION_LEVEL);
130 }
131
132 if (KNOB_JIT_ENABLE_CACHE)
133 {
134 mCache.Init(this, mHostCpuName, mOptLevel);
135 }
136
137 SetupNewModule();
138 mIsModuleFinalized = true;
139
140 // fetch function signature
141 #if USE_SIMD16_SHADERS
142 // typedef void(__cdecl *PFN_FETCH_FUNC)(SWR_FETCH_CONTEXT& fetchInfo, simd16vertex& out);
143 #else
144 // typedef void(__cdecl *PFN_FETCH_FUNC)(SWR_FETCH_CONTEXT& fetchInfo, simdvertex& out);
145 #endif
146 std::vector<Type*> fsArgs;
147
148 // llvm5 is picky and does not take a void * type
149 fsArgs.push_back(PointerType::get(Gen_SWR_FETCH_CONTEXT(this), 0));
150
151 fsArgs.push_back(Type::getInt8PtrTy(mContext));
152
153 fsArgs.push_back(PointerType::get(Gen_SWR_FETCH_CONTEXT(this), 0));
154 #if USE_SIMD16_SHADERS
155 fsArgs.push_back(PointerType::get(Gen_simd16vertex(this), 0));
156 #else
157 fsArgs.push_back(PointerType::get(Gen_simdvertex(this), 0));
158 #endif
159
160 mFetchShaderTy = FunctionType::get(Type::getVoidTy(mContext), fsArgs, false);
161
162 #if defined(_MSC_VER)
163 // explicitly instantiate used symbols from potentially staticly linked libs
164 sys::DynamicLibrary::AddSymbol("exp2f", &exp2f);
165 sys::DynamicLibrary::AddSymbol("log2f", &log2f);
166 sys::DynamicLibrary::AddSymbol("sinf", &sinf);
167 sys::DynamicLibrary::AddSymbol("cosf", &cosf);
168 sys::DynamicLibrary::AddSymbol("powf", &powf);
169 #endif
170
171 #if defined(_WIN32)
172 if (KNOB_DUMP_SHADER_IR)
173 {
174 CreateDirectoryPath(INTEL_OUTPUT_DIR);
175 CreateDirectoryPath(SWR_OUTPUT_DIR);
176 CreateDirectoryPath(JITTER_OUTPUT_DIR);
177 }
178 #endif
179 }
180
CreateExecEngine(std::unique_ptr<Module> pModule)181 void JitManager::CreateExecEngine(std::unique_ptr<Module> pModule)
182 {
183 TargetOptions tOpts;
184 tOpts.AllowFPOpFusion = FPOpFusion::Fast;
185 tOpts.NoInfsFPMath = false;
186 tOpts.NoNaNsFPMath = false;
187 tOpts.UnsafeFPMath = false;
188
189 // tOpts.PrintMachineCode = true;
190
191 mpExec = EngineBuilder(std::move(pModule))
192 .setTargetOptions(tOpts)
193 .setOptLevel(mOptLevel)
194 .setMCPU(mHostCpuName)
195 .create();
196
197 if (KNOB_JIT_ENABLE_CACHE)
198 {
199 mpExec->setObjectCache(&mCache);
200 }
201
202 #if LLVM_USE_INTEL_JITEVENTS
203 JITEventListener* vTune = JITEventListener::createIntelJITEventListener();
204 mpExec->RegisterJITEventListener(vTune);
205 #endif
206
207 mvExecEngines.push_back(mpExec);
208 }
209
210 //////////////////////////////////////////////////////////////////////////
211 /// @brief Create new LLVM module.
SetupNewModule()212 void JitManager::SetupNewModule()
213 {
214 SWR_ASSERT(mIsModuleFinalized == true && "Current module is not finalized!");
215
216 std::unique_ptr<Module> newModule(new Module("", mContext));
217 mpCurrentModule = newModule.get();
218 mpCurrentModule->setTargetTriple(sys::getProcessTriple());
219 CreateExecEngine(std::move(newModule));
220 mIsModuleFinalized = false;
221 }
222
223
224 DIType*
CreateDebugStructType(StructType * pType,const std::string & name,DIFile * pFile,uint32_t lineNum,const std::vector<std::pair<std::string,uint32_t>> & members)225 JitManager::CreateDebugStructType(StructType* pType,
226 const std::string& name,
227 DIFile* pFile,
228 uint32_t lineNum,
229 const std::vector<std::pair<std::string, uint32_t>>& members)
230 {
231 DIBuilder builder(*mpCurrentModule);
232 SmallVector<Metadata*, 8> ElemTypes;
233 DataLayout DL = DataLayout(mpCurrentModule);
234 uint32_t size = DL.getTypeAllocSizeInBits(pType);
235 uint32_t alignment = DL.getABITypeAlignment(pType);
236 DINode::DIFlags flags = DINode::DIFlags::FlagPublic;
237
238 DICompositeType* pDIStructTy = builder.createStructType(pFile,
239 name,
240 pFile,
241 lineNum,
242 size,
243 alignment,
244 flags,
245 nullptr,
246 builder.getOrCreateArray(ElemTypes));
247
248 // Register mapping now to break loops (in case struct contains itself or pointers to itself)
249 mDebugStructMap[pType] = pDIStructTy;
250
251 uint32_t idx = 0;
252 for (auto& elem : pType->elements())
253 {
254 std::string name = members[idx].first;
255 uint32_t lineNum = members[idx].second;
256 size = DL.getTypeAllocSizeInBits(elem);
257 alignment = DL.getABITypeAlignment(elem);
258 uint32_t offset = DL.getStructLayout(pType)->getElementOffsetInBits(idx);
259 llvm::DIType* pDebugTy = GetDebugType(elem);
260 ElemTypes.push_back(builder.createMemberType(
261 pDIStructTy, name, pFile, lineNum, size, alignment, offset, flags, pDebugTy));
262
263 idx++;
264 }
265
266 pDIStructTy->replaceElements(builder.getOrCreateArray(ElemTypes));
267 return pDIStructTy;
268 }
269
GetDebugArrayType(Type * pTy)270 DIType* JitManager::GetDebugArrayType(Type* pTy)
271 {
272 DIBuilder builder(*mpCurrentModule);
273 DataLayout DL = DataLayout(mpCurrentModule);
274 ArrayType* pArrayTy = cast<ArrayType>(pTy);
275 uint32_t size = DL.getTypeAllocSizeInBits(pArrayTy);
276 uint32_t alignment = DL.getABITypeAlignment(pArrayTy);
277
278 SmallVector<Metadata*, 8> Elems;
279 Elems.push_back(builder.getOrCreateSubrange(0, pArrayTy->getNumElements()));
280 return builder.createArrayType(
281 size, alignment, GetDebugType(pArrayTy->getElementType()), builder.getOrCreateArray(Elems));
282 }
283
284 // Create a DIType from llvm Type
GetDebugType(Type * pTy)285 DIType* JitManager::GetDebugType(Type* pTy)
286 {
287 DIBuilder builder(*mpCurrentModule);
288 Type::TypeID id = pTy->getTypeID();
289
290 switch (id)
291 {
292 case Type::VoidTyID:
293 return builder.createUnspecifiedType("void");
294 break;
295 case Type::HalfTyID:
296 return builder.createBasicType("float16", 16, dwarf::DW_ATE_float);
297 break;
298 case Type::FloatTyID:
299 return builder.createBasicType("float", 32, dwarf::DW_ATE_float);
300 break;
301 case Type::DoubleTyID:
302 return builder.createBasicType("double", 64, dwarf::DW_ATE_float);
303 break;
304 case Type::IntegerTyID:
305 return GetDebugIntegerType(pTy);
306 break;
307 case Type::StructTyID:
308 return GetDebugStructType(pTy);
309 break;
310 case Type::ArrayTyID:
311 return GetDebugArrayType(pTy);
312 break;
313 case Type::PointerTyID:
314 return builder.createPointerType(GetDebugType(pTy->getPointerElementType()), 64, 64);
315 break;
316 #if LLVM_VERSION_MAJOR >= 11
317 case Type::FixedVectorTyID:
318 #else
319 case Type::VectorTyID:
320 #endif
321 return GetDebugVectorType(pTy);
322 break;
323 case Type::FunctionTyID:
324 return GetDebugFunctionType(pTy);
325 break;
326 default:
327 SWR_ASSERT(false, "Unimplemented llvm type");
328 }
329 return nullptr;
330 }
331
332 // Create a DISubroutineType from an llvm FunctionType
GetDebugFunctionType(Type * pTy)333 DIType* JitManager::GetDebugFunctionType(Type* pTy)
334 {
335 SmallVector<Metadata*, 8> ElemTypes;
336 FunctionType* pFuncTy = cast<FunctionType>(pTy);
337 DIBuilder builder(*mpCurrentModule);
338
339 // Add result type
340 ElemTypes.push_back(GetDebugType(pFuncTy->getReturnType()));
341
342 // Add arguments
343 for (auto& param : pFuncTy->params())
344 {
345 ElemTypes.push_back(GetDebugType(param));
346 }
347
348 return builder.createSubroutineType(builder.getOrCreateTypeArray(ElemTypes));
349 }
350
GetDebugIntegerType(Type * pTy)351 DIType* JitManager::GetDebugIntegerType(Type* pTy)
352 {
353 DIBuilder builder(*mpCurrentModule);
354 IntegerType* pIntTy = cast<IntegerType>(pTy);
355 switch (pIntTy->getBitWidth())
356 {
357 case 1:
358 return builder.createBasicType("int1", 1, dwarf::DW_ATE_unsigned);
359 break;
360 case 8:
361 return builder.createBasicType("int8", 8, dwarf::DW_ATE_signed);
362 break;
363 case 16:
364 return builder.createBasicType("int16", 16, dwarf::DW_ATE_signed);
365 break;
366 case 32:
367 return builder.createBasicType("int", 32, dwarf::DW_ATE_signed);
368 break;
369 case 64:
370 return builder.createBasicType("int64", 64, dwarf::DW_ATE_signed);
371 break;
372 case 128:
373 return builder.createBasicType("int128", 128, dwarf::DW_ATE_signed);
374 break;
375 default:
376 SWR_ASSERT(false, "Unimplemented integer bit width");
377 }
378 return nullptr;
379 }
380
GetDebugVectorType(Type * pTy)381 DIType* JitManager::GetDebugVectorType(Type* pTy)
382 {
383 DIBuilder builder(*mpCurrentModule);
384 VectorType* pVecTy = cast<VectorType>(pTy);
385 DataLayout DL = DataLayout(mpCurrentModule);
386 uint32_t size = DL.getTypeAllocSizeInBits(pVecTy);
387 uint32_t alignment = DL.getABITypeAlignment(pVecTy);
388 SmallVector<Metadata*, 1> Elems;
389
390 #if LLVM_VERSION_MAJOR >= 11
391 Elems.push_back(builder.getOrCreateSubrange(0, pVecTy->getNumElements()));
392 #else
393 Elems.push_back(builder.getOrCreateSubrange(0, pVecTy->getVectorNumElements()));
394 #endif
395
396 return builder.createVectorType(size,
397 alignment,
398 #if LLVM_VERSION_MAJOR >= 11
399 GetDebugType(pVecTy->getElementType()),
400 #else
401 GetDebugType(pVecTy->getVectorElementType()),
402 #endif
403 builder.getOrCreateArray(Elems));
404 }
405
406 //////////////////////////////////////////////////////////////////////////
407 /// @brief Dump function x86 assembly to file.
408 /// @note This should only be called after the module has been jitted to x86 and the
409 /// module will not be further accessed.
DumpAsm(Function * pFunction,const char * fileName)410 void JitManager::DumpAsm(Function* pFunction, const char* fileName)
411 {
412 if (KNOB_DUMP_SHADER_IR)
413 {
414 #if defined(_WIN32)
415 DWORD pid = GetCurrentProcessId();
416 char procname[MAX_PATH];
417 GetModuleFileNameA(NULL, procname, MAX_PATH);
418 const char* pBaseName = strrchr(procname, '\\');
419 std::stringstream outDir;
420 outDir << JITTER_OUTPUT_DIR << pBaseName << "_" << pid << std::ends;
421 CreateDirectoryPath(outDir.str().c_str());
422 #endif
423
424 std::error_code EC;
425 Module* pModule = pFunction->getParent();
426 const char* funcName = pFunction->getName().data();
427 char fName[256];
428 #if defined(_WIN32)
429 sprintf(fName, "%s\\%s.%s.asm", outDir.str().c_str(), funcName, fileName);
430 #else
431 sprintf(fName, "%s.%s.asm", funcName, fileName);
432 #endif
433
434 raw_fd_ostream filestream(fName, EC, llvm::sys::fs::F_None);
435
436 legacy::PassManager* pMPasses = new legacy::PassManager();
437 auto* pTarget = mpExec->getTargetMachine();
438 pTarget->Options.MCOptions.AsmVerbose = true;
439 #if LLVM_VERSION_MAJOR >= 10
440 pTarget->addPassesToEmitFile(
441 *pMPasses, filestream, nullptr, CGFT_AssemblyFile);
442 #elif LLVM_VERSION_MAJOR >= 7
443 pTarget->addPassesToEmitFile(
444 *pMPasses, filestream, nullptr, TargetMachine::CGFT_AssemblyFile);
445 #else
446 pTarget->addPassesToEmitFile(*pMPasses, filestream, TargetMachine::CGFT_AssemblyFile);
447 #endif
448 pMPasses->run(*pModule);
449 delete pMPasses;
450 pTarget->Options.MCOptions.AsmVerbose = false;
451 }
452 }
453
GetOutputDir()454 std::string JitManager::GetOutputDir()
455 {
456 #if defined(_WIN32)
457 DWORD pid = GetCurrentProcessId();
458 char procname[MAX_PATH];
459 GetModuleFileNameA(NULL, procname, MAX_PATH);
460 const char* pBaseName = strrchr(procname, '\\');
461 std::stringstream outDir;
462 outDir << JITTER_OUTPUT_DIR << pBaseName << "_" << pid;
463 CreateDirectoryPath(outDir.str().c_str());
464 return outDir.str();
465 #endif
466 return "";
467 }
468
469 //////////////////////////////////////////////////////////////////////////
470 /// @brief Dump function to file.
DumpToFile(Module * M,const char * fileName,llvm::AssemblyAnnotationWriter * annotater)471 void JitManager::DumpToFile(Module* M,
472 const char* fileName,
473 llvm::AssemblyAnnotationWriter* annotater)
474 {
475 if (KNOB_DUMP_SHADER_IR)
476 {
477 std::string outDir = GetOutputDir();
478
479 std::error_code EC;
480 const char* funcName = M->getName().data();
481 char fName[256];
482 #if defined(_WIN32)
483 sprintf(fName, "%s\\%s.%s.ll", outDir.c_str(), funcName, fileName);
484 #else
485 sprintf(fName, "%s.%s.ll", funcName, fileName);
486 #endif
487 raw_fd_ostream fd(fName, EC, llvm::sys::fs::F_None);
488 M->print(fd, annotater);
489 fd.flush();
490 }
491 }
492
493 //////////////////////////////////////////////////////////////////////////
494 /// @brief Dump function to file.
DumpToFile(Function * f,const char * fileName)495 void JitManager::DumpToFile(Function* f, const char* fileName)
496 {
497 if (KNOB_DUMP_SHADER_IR)
498 {
499 std::string outDir = GetOutputDir();
500
501 std::error_code EC;
502 const char* funcName = f->getName().data();
503 char fName[256];
504 #if defined(_WIN32)
505 sprintf(fName, "%s\\%s.%s.ll", outDir.c_str(), funcName, fileName);
506 #else
507 sprintf(fName, "%s.%s.ll", funcName, fileName);
508 #endif
509 raw_fd_ostream fd(fName, EC, llvm::sys::fs::F_None);
510 f->print(fd, nullptr);
511
512 #if defined(_WIN32)
513 sprintf(fName, "%s\\cfg.%s.%s.dot", outDir.c_str(), funcName, fileName);
514 #else
515 sprintf(fName, "cfg.%s.%s.dot", funcName, fileName);
516 #endif
517 fd.flush();
518
519 raw_fd_ostream fd_cfg(fName, EC, llvm::sys::fs::F_Text);
520 WriteGraph(fd_cfg, (const Function*)f);
521
522 fd_cfg.flush();
523 }
524 }
525
526 extern "C" {
527 bool g_DllActive = true;
528
529 //////////////////////////////////////////////////////////////////////////
530 /// @brief Create JIT context.
531 /// @param simdWidth - SIMD width to be used in generated program.
JitCreateContext(uint32_t targetSimdWidth,const char * arch,const char * core)532 HANDLE JITCALL JitCreateContext(uint32_t targetSimdWidth, const char* arch, const char* core)
533 {
534 return new JitManager(targetSimdWidth, arch, core);
535 }
536
537 //////////////////////////////////////////////////////////////////////////
538 /// @brief Destroy JIT context.
JitDestroyContext(HANDLE hJitContext)539 void JITCALL JitDestroyContext(HANDLE hJitContext)
540 {
541 if (g_DllActive)
542 {
543 delete reinterpret_cast<JitManager*>(hJitContext);
544 }
545 }
546 }
547
548 //////////////////////////////////////////////////////////////////////////
549 /// JitCache
550 //////////////////////////////////////////////////////////////////////////
551
552 //////////////////////////////////////////////////////////////////////////
553 /// JitCacheFileHeader
554 //////////////////////////////////////////////////////////////////////////
555 struct JitCacheFileHeader
556 {
InitJitCacheFileHeader557 void Init(uint32_t llCRC,
558 uint32_t objCRC,
559 const std::string& moduleID,
560 const std::string& cpu,
561 uint32_t optLevel,
562 uint64_t objSize)
563 {
564 m_objSize = objSize;
565 m_llCRC = llCRC;
566 m_objCRC = objCRC;
567 strncpy(m_ModuleID, moduleID.c_str(), JC_STR_MAX_LEN - 1);
568 m_ModuleID[JC_STR_MAX_LEN - 1] = 0;
569 strncpy(m_Cpu, cpu.c_str(), JC_STR_MAX_LEN - 1);
570 m_Cpu[JC_STR_MAX_LEN - 1] = 0;
571 m_optLevel = optLevel;
572 }
573
574
575 bool
IsValidJitCacheFileHeader576 IsValid(uint32_t llCRC, const std::string& moduleID, const std::string& cpu, uint32_t optLevel)
577 {
578 if ((m_MagicNumber != JC_MAGIC_NUMBER) || (m_llCRC != llCRC) ||
579 (m_platformKey != JC_PLATFORM_KEY) || (m_optLevel != optLevel))
580 {
581 return false;
582 }
583
584 m_ModuleID[JC_STR_MAX_LEN - 1] = 0;
585 if (strncmp(moduleID.c_str(), m_ModuleID, JC_STR_MAX_LEN - 1))
586 {
587 return false;
588 }
589
590 m_Cpu[JC_STR_MAX_LEN - 1] = 0;
591 if (strncmp(cpu.c_str(), m_Cpu, JC_STR_MAX_LEN - 1))
592 {
593 return false;
594 }
595
596 return true;
597 }
598
GetObjectSizeJitCacheFileHeader599 uint64_t GetObjectSize() const { return m_objSize; }
GetObjectCRCJitCacheFileHeader600 uint64_t GetObjectCRC() const { return m_objCRC; }
601
602 private:
603 static const uint64_t JC_MAGIC_NUMBER = 0xfedcba9876543210ULL + 7;
604 static const size_t JC_STR_MAX_LEN = 32;
605 static const uint32_t JC_PLATFORM_KEY = (LLVM_VERSION_MAJOR << 24) |
606 (LLVM_VERSION_MINOR << 16) | (LLVM_VERSION_PATCH << 8) |
607 ((sizeof(void*) > sizeof(uint32_t)) ? 1 : 0);
608
609 uint64_t m_MagicNumber = JC_MAGIC_NUMBER;
610 uint64_t m_objSize = 0;
611 uint32_t m_llCRC = 0;
612 uint32_t m_platformKey = JC_PLATFORM_KEY;
613 uint32_t m_objCRC = 0;
614 uint32_t m_optLevel = 0;
615 char m_ModuleID[JC_STR_MAX_LEN] = {};
616 char m_Cpu[JC_STR_MAX_LEN] = {};
617 };
618
ComputeModuleCRC(const llvm::Module * M)619 static inline uint32_t ComputeModuleCRC(const llvm::Module* M)
620 {
621 std::string bitcodeBuffer;
622 raw_string_ostream bitcodeStream(bitcodeBuffer);
623
624 #if LLVM_VERSION_MAJOR >= 7
625 llvm::WriteBitcodeToFile(*M, bitcodeStream);
626 #else
627 llvm::WriteBitcodeToFile(M, bitcodeStream);
628 #endif
629 // M->print(bitcodeStream, nullptr, false);
630
631 bitcodeStream.flush();
632
633 return ComputeCRC(0, bitcodeBuffer.data(), bitcodeBuffer.size());
634 }
635
636 /// constructor
JitCache()637 JitCache::JitCache()
638 {
639 #if defined(__APPLE__) || defined(FORCE_LINUX) || defined(__linux__) || defined(__gnu_linux__)
640 if (strncmp(KNOB_JIT_CACHE_DIR.c_str(), "~/", 2) == 0)
641 {
642 char* homedir;
643 if (!(homedir = getenv("HOME")))
644 {
645 homedir = getpwuid(getuid())->pw_dir;
646 }
647 mCacheDir = homedir;
648 mCacheDir += (KNOB_JIT_CACHE_DIR.c_str() + 1);
649 }
650 else
651 #endif
652 {
653 mCacheDir = KNOB_JIT_CACHE_DIR;
654 }
655
656 // Create cache dir at startup to allow jitter to write debug.ll files
657 // to that directory.
658 if (!llvm::sys::fs::exists(mCacheDir.str()) &&
659 llvm::sys::fs::create_directories(mCacheDir.str()))
660 {
661 SWR_INVALID("Unable to create directory: %s", mCacheDir.c_str());
662 }
663
664 }
665
ExecUnhookedProcess(const std::string & CmdLine,std::string * pStdOut,std::string * pStdErr)666 int ExecUnhookedProcess(const std::string& CmdLine, std::string* pStdOut, std::string* pStdErr)
667 {
668
669 return ExecCmd(CmdLine, nullptr, pStdOut, pStdErr);
670 }
671
672 /// Calculate actual directory where module will be cached.
673 /// This is always a subdirectory of mCacheDir. Full absolute
674 /// path name will be stored in mCurrentModuleCacheDir
CalcModuleCacheDir()675 void JitCache::CalcModuleCacheDir()
676 {
677 mModuleCacheDir.clear();
678
679 llvm::SmallString<MAX_PATH> moduleDir = mCacheDir;
680
681 // Create 4 levels of directory hierarchy based on CRC, 256 entries each
682 uint8_t* pCRC = (uint8_t*)&mCurrentModuleCRC;
683 for (uint32_t i = 0; i < 4; ++i)
684 {
685 llvm::sys::path::append(moduleDir, std::to_string((int)pCRC[i]));
686 }
687
688 mModuleCacheDir = moduleDir;
689 }
690
691 /// notifyObjectCompiled - Provides a pointer to compiled code for Module M.
notifyObjectCompiled(const llvm::Module * M,llvm::MemoryBufferRef Obj)692 void JitCache::notifyObjectCompiled(const llvm::Module* M, llvm::MemoryBufferRef Obj)
693 {
694 const std::string& moduleID = M->getModuleIdentifier();
695 if (!moduleID.length())
696 {
697 return;
698 }
699
700 if (!mModuleCacheDir.size())
701 {
702 SWR_INVALID("Unset module cache directory");
703 return;
704 }
705
706 if (!llvm::sys::fs::exists(mModuleCacheDir.str()) &&
707 llvm::sys::fs::create_directories(mModuleCacheDir.str()))
708 {
709 SWR_INVALID("Unable to create directory: %s", mModuleCacheDir.c_str());
710 return;
711 }
712
713 JitCacheFileHeader header;
714
715 llvm::SmallString<MAX_PATH> filePath = mModuleCacheDir;
716 llvm::sys::path::append(filePath, moduleID);
717
718 llvm::SmallString<MAX_PATH> objPath = filePath;
719 objPath += JIT_OBJ_EXT;
720
721 {
722 std::error_code err;
723 llvm::raw_fd_ostream fileObj(objPath.c_str(), err, llvm::sys::fs::F_None);
724 fileObj << Obj.getBuffer();
725 fileObj.flush();
726 }
727
728
729 {
730 std::error_code err;
731 llvm::raw_fd_ostream fileObj(filePath.c_str(), err, llvm::sys::fs::F_None);
732
733 uint32_t objcrc = ComputeCRC(0, Obj.getBufferStart(), Obj.getBufferSize());
734
735 header.Init(mCurrentModuleCRC, objcrc, moduleID, mCpu, mOptLevel, Obj.getBufferSize());
736
737 fileObj.write((const char*)&header, sizeof(header));
738 fileObj.flush();
739 }
740 }
741
742 /// Returns a pointer to a newly allocated MemoryBuffer that contains the
743 /// object which corresponds with Module M, or 0 if an object is not
744 /// available.
getObject(const llvm::Module * M)745 std::unique_ptr<llvm::MemoryBuffer> JitCache::getObject(const llvm::Module* M)
746 {
747 const std::string& moduleID = M->getModuleIdentifier();
748 mCurrentModuleCRC = ComputeModuleCRC(M);
749
750 if (!moduleID.length())
751 {
752 return nullptr;
753 }
754
755 CalcModuleCacheDir();
756
757 if (!llvm::sys::fs::exists(mModuleCacheDir))
758 {
759 return nullptr;
760 }
761
762 llvm::SmallString<MAX_PATH> filePath = mModuleCacheDir;
763 llvm::sys::path::append(filePath, moduleID);
764
765 llvm::SmallString<MAX_PATH> objFilePath = filePath;
766 objFilePath += JIT_OBJ_EXT;
767
768 FILE* fpObjIn = nullptr;
769 FILE* fpIn = fopen(filePath.c_str(), "rb");
770 if (!fpIn)
771 {
772 return nullptr;
773 }
774
775 std::unique_ptr<llvm::MemoryBuffer> pBuf = nullptr;
776 do
777 {
778 JitCacheFileHeader header;
779 if (!fread(&header, sizeof(header), 1, fpIn))
780 {
781 break;
782 }
783
784 if (!header.IsValid(mCurrentModuleCRC, moduleID, mCpu, mOptLevel))
785 {
786 break;
787 }
788
789 fpObjIn = fopen(objFilePath.c_str(), "rb");
790 if (!fpObjIn)
791 {
792 break;
793 }
794
795 #if LLVM_VERSION_MAJOR < 6
796 pBuf = llvm::MemoryBuffer::getNewUninitMemBuffer(size_t(header.GetObjectSize()));
797 #else
798 pBuf = llvm::WritableMemoryBuffer::getNewUninitMemBuffer(size_t(header.GetObjectSize()));
799 #endif
800 if (!fread(const_cast<char*>(pBuf->getBufferStart()), header.GetObjectSize(), 1, fpObjIn))
801 {
802 pBuf = nullptr;
803 break;
804 }
805
806 if (header.GetObjectCRC() != ComputeCRC(0, pBuf->getBufferStart(), pBuf->getBufferSize()))
807 {
808 SWR_TRACE("Invalid object cache file, ignoring: %s", filePath.c_str());
809 pBuf = nullptr;
810 break;
811 }
812
813 } while (0);
814
815 fclose(fpIn);
816
817 if (fpObjIn)
818 {
819 fclose(fpObjIn);
820 }
821
822
823 return pBuf;
824 }
825
emitInstructionAnnot(const llvm::Instruction * pInst,llvm::formatted_raw_ostream & OS)826 void InterleaveAssemblyAnnotater::emitInstructionAnnot(const llvm::Instruction* pInst,
827 llvm::formatted_raw_ostream& OS)
828 {
829 auto dbgLoc = pInst->getDebugLoc();
830 if (dbgLoc)
831 {
832 unsigned int line = dbgLoc.getLine();
833 if (line != mCurrentLineNo)
834 {
835 if (line > 0 && line <= mAssembly.size())
836 {
837 // HACK: here we assume that OS is a formatted_raw_ostream(ods())
838 // and modify the color accordingly. We can't do the color
839 // modification on OS because formatted_raw_ostream strips
840 // the color information. The only way to fix this behavior
841 // is to patch LLVM.
842 OS << "\n; " << line << ": " << mAssembly[line - 1] << "\n";
843 }
844 mCurrentLineNo = line;
845 }
846 }
847 }
848