swr/rasterizer: improvements in simdlib
[mesa.git] / src / gallium / drivers / swr / rasterizer / jitter / JitManager.cpp
1 /****************************************************************************
2 * Copyright (C) 2014-2018 Intel Corporation. All Rights Reserved.
3 *
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
10 *
11 * The above copyright notice and this permission notice (including the next
12 * paragraph) shall be included in all copies or substantial portions of the
13 * Software.
14 *
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
18 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
20 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
21 * IN THE SOFTWARE.
22 *
23 * @file JitManager.cpp
24 *
25 * @brief Implementation if the Jit Manager.
26 *
27 * Notes:
28 *
29 ******************************************************************************/
30 #include "jit_pch.hpp"
31
32 #include "JitManager.h"
33 #include "jit_api.h"
34 #include "fetch_jit.h"
35
36 #include "core/state.h"
37
38 #include "gen_state_llvm.h"
39
40 #include <sstream>
41 #if defined(_WIN32)
42 #include <psapi.h>
43 #include <cstring>
44
45 #define INTEL_OUTPUT_DIR "c:\\Intel"
46 #define SWR_OUTPUT_DIR INTEL_OUTPUT_DIR "\\SWR"
47 #define JITTER_OUTPUT_DIR SWR_OUTPUT_DIR "\\Jitter"
48 #endif // _WIN32
49
50 #if defined(__APPLE__) || defined(FORCE_LINUX) || defined(__linux__) || defined(__gnu_linux__)
51 #include <pwd.h>
52 #include <sys/stat.h>
53 #endif
54
55
56 using namespace llvm;
57 using namespace SwrJit;
58
59 //////////////////////////////////////////////////////////////////////////
60 /// @brief Contructor for JitManager.
61 /// @param simdWidth - SIMD width to be used in generated program.
62 JitManager::JitManager(uint32_t simdWidth, const char* arch, const char* core) :
63 mContext(), mBuilder(mContext), mIsModuleFinalized(true), mJitNumber(0), mVWidth(simdWidth),
64 mArch(arch)
65 {
66 mpCurrentModule = nullptr;
67 mpExec = nullptr;
68
69 InitializeNativeTarget();
70 InitializeNativeTargetAsmPrinter();
71 InitializeNativeTargetDisassembler();
72
73
74 // force JIT to use the same CPU arch as the rest of swr
75 if (mArch.AVX512F())
76 {
77 #if USE_SIMD16_SHADERS
78 if (mArch.AVX512ER())
79 {
80 mHostCpuName = StringRef("knl");
81 }
82 else
83 {
84 mHostCpuName = StringRef("skylake-avx512");
85 }
86 mUsingAVX512 = true;
87 #else
88 mHostCpuName = StringRef("core-avx2");
89 #endif
90 if (mVWidth == 0)
91 {
92 mVWidth = 8;
93 }
94 }
95 else if (mArch.AVX2())
96 {
97 mHostCpuName = StringRef("core-avx2");
98 if (mVWidth == 0)
99 {
100 mVWidth = 8;
101 }
102 }
103 else if (mArch.AVX())
104 {
105 if (mArch.F16C())
106 {
107 mHostCpuName = StringRef("core-avx-i");
108 }
109 else
110 {
111 mHostCpuName = StringRef("corei7-avx");
112 }
113 if (mVWidth == 0)
114 {
115 mVWidth = 8;
116 }
117 }
118 else
119 {
120 SWR_INVALID("Jitting requires at least AVX ISA support");
121 }
122
123
124 mOptLevel = CodeGenOpt::Aggressive;
125
126 if (KNOB_JIT_OPTIMIZATION_LEVEL >= CodeGenOpt::None &&
127 KNOB_JIT_OPTIMIZATION_LEVEL <= CodeGenOpt::Aggressive)
128 {
129 mOptLevel = CodeGenOpt::Level(KNOB_JIT_OPTIMIZATION_LEVEL);
130 }
131
132 if (KNOB_JIT_ENABLE_CACHE)
133 {
134 mCache.Init(this, mHostCpuName, mOptLevel);
135 }
136
137 SetupNewModule();
138 mIsModuleFinalized = true;
139
140 // fetch function signature
141 #if USE_SIMD16_SHADERS
142 // typedef void(__cdecl *PFN_FETCH_FUNC)(SWR_FETCH_CONTEXT& fetchInfo, simd16vertex& out);
143 #else
144 // typedef void(__cdecl *PFN_FETCH_FUNC)(SWR_FETCH_CONTEXT& fetchInfo, simdvertex& out);
145 #endif
146 std::vector<Type*> fsArgs;
147
148 // llvm5 is picky and does not take a void * type
149 fsArgs.push_back(PointerType::get(Gen_SWR_FETCH_CONTEXT(this), 0));
150
151 fsArgs.push_back(Type::getInt8PtrTy(mContext));
152
153 fsArgs.push_back(PointerType::get(Gen_SWR_FETCH_CONTEXT(this), 0));
154 #if USE_SIMD16_SHADERS
155 fsArgs.push_back(PointerType::get(Gen_simd16vertex(this), 0));
156 #else
157 fsArgs.push_back(PointerType::get(Gen_simdvertex(this), 0));
158 #endif
159
160 mFetchShaderTy = FunctionType::get(Type::getVoidTy(mContext), fsArgs, false);
161
162 #if defined(_WIN32)
163 // explicitly instantiate used symbols from potentially staticly linked libs
164 sys::DynamicLibrary::AddSymbol("exp2f", &exp2f);
165 sys::DynamicLibrary::AddSymbol("log2f", &log2f);
166 sys::DynamicLibrary::AddSymbol("sinf", &sinf);
167 sys::DynamicLibrary::AddSymbol("cosf", &cosf);
168 sys::DynamicLibrary::AddSymbol("powf", &powf);
169 #endif
170
171 #if defined(_WIN32)
172 if (KNOB_DUMP_SHADER_IR)
173 {
174 CreateDirectoryPath(INTEL_OUTPUT_DIR);
175 CreateDirectoryPath(SWR_OUTPUT_DIR);
176 CreateDirectoryPath(JITTER_OUTPUT_DIR);
177 }
178 #endif
179 }
180
181 void JitManager::CreateExecEngine(std::unique_ptr<Module> pModule)
182 {
183 TargetOptions tOpts;
184 tOpts.AllowFPOpFusion = FPOpFusion::Fast;
185 tOpts.NoInfsFPMath = false;
186 tOpts.NoNaNsFPMath = false;
187 tOpts.UnsafeFPMath = false;
188
189 // tOpts.PrintMachineCode = true;
190
191 mpExec = EngineBuilder(std::move(pModule))
192 .setTargetOptions(tOpts)
193 .setOptLevel(mOptLevel)
194 .setMCPU(mHostCpuName)
195 .create();
196
197 if (KNOB_JIT_ENABLE_CACHE)
198 {
199 mpExec->setObjectCache(&mCache);
200 }
201
202 #if LLVM_USE_INTEL_JITEVENTS
203 JITEventListener* vTune = JITEventListener::createIntelJITEventListener();
204 mpExec->RegisterJITEventListener(vTune);
205 #endif
206
207 mvExecEngines.push_back(mpExec);
208 }
209
210 //////////////////////////////////////////////////////////////////////////
211 /// @brief Create new LLVM module.
212 void JitManager::SetupNewModule()
213 {
214 SWR_ASSERT(mIsModuleFinalized == true && "Current module is not finalized!");
215
216 std::unique_ptr<Module> newModule(new Module("", mContext));
217 mpCurrentModule = newModule.get();
218 mpCurrentModule->setTargetTriple(sys::getProcessTriple());
219 CreateExecEngine(std::move(newModule));
220 mIsModuleFinalized = false;
221 }
222
223
224 DIType*
225 JitManager::CreateDebugStructType(StructType* pType,
226 const std::string& name,
227 DIFile* pFile,
228 uint32_t lineNum,
229 const std::vector<std::pair<std::string, uint32_t>>& members)
230 {
231 DIBuilder builder(*mpCurrentModule);
232 SmallVector<Metadata*, 8> ElemTypes;
233 DataLayout DL = DataLayout(mpCurrentModule);
234 uint32_t size = DL.getTypeAllocSizeInBits(pType);
235 uint32_t alignment = DL.getABITypeAlignment(pType);
236 DINode::DIFlags flags = DINode::DIFlags::FlagPublic;
237
238 DICompositeType* pDIStructTy = builder.createStructType(pFile,
239 name,
240 pFile,
241 lineNum,
242 size,
243 alignment,
244 flags,
245 nullptr,
246 builder.getOrCreateArray(ElemTypes));
247
248 // Register mapping now to break loops (in case struct contains itself or pointers to itself)
249 mDebugStructMap[pType] = pDIStructTy;
250
251 uint32_t idx = 0;
252 for (auto& elem : pType->elements())
253 {
254 std::string name = members[idx].first;
255 uint32_t lineNum = members[idx].second;
256 size = DL.getTypeAllocSizeInBits(elem);
257 alignment = DL.getABITypeAlignment(elem);
258 uint32_t offset = DL.getStructLayout(pType)->getElementOffsetInBits(idx);
259 llvm::DIType* pDebugTy = GetDebugType(elem);
260 ElemTypes.push_back(builder.createMemberType(
261 pDIStructTy, name, pFile, lineNum, size, alignment, offset, flags, pDebugTy));
262
263 idx++;
264 }
265
266 pDIStructTy->replaceElements(builder.getOrCreateArray(ElemTypes));
267 return pDIStructTy;
268 }
269
270 DIType* JitManager::GetDebugArrayType(Type* pTy)
271 {
272 DIBuilder builder(*mpCurrentModule);
273 DataLayout DL = DataLayout(mpCurrentModule);
274 ArrayType* pArrayTy = cast<ArrayType>(pTy);
275 uint32_t size = DL.getTypeAllocSizeInBits(pArrayTy);
276 uint32_t alignment = DL.getABITypeAlignment(pArrayTy);
277
278 SmallVector<Metadata*, 8> Elems;
279 Elems.push_back(builder.getOrCreateSubrange(0, pArrayTy->getNumElements()));
280 return builder.createArrayType(
281 size, alignment, GetDebugType(pArrayTy->getElementType()), builder.getOrCreateArray(Elems));
282 }
283
284 // Create a DIType from llvm Type
285 DIType* JitManager::GetDebugType(Type* pTy)
286 {
287 DIBuilder builder(*mpCurrentModule);
288 Type::TypeID id = pTy->getTypeID();
289
290 switch (id)
291 {
292 case Type::VoidTyID:
293 return builder.createUnspecifiedType("void");
294 break;
295 case Type::HalfTyID:
296 return builder.createBasicType("float16", 16, dwarf::DW_ATE_float);
297 break;
298 case Type::FloatTyID:
299 return builder.createBasicType("float", 32, dwarf::DW_ATE_float);
300 break;
301 case Type::DoubleTyID:
302 return builder.createBasicType("double", 64, dwarf::DW_ATE_float);
303 break;
304 case Type::IntegerTyID:
305 return GetDebugIntegerType(pTy);
306 break;
307 case Type::StructTyID:
308 return GetDebugStructType(pTy);
309 break;
310 case Type::ArrayTyID:
311 return GetDebugArrayType(pTy);
312 break;
313 case Type::PointerTyID:
314 return builder.createPointerType(GetDebugType(pTy->getPointerElementType()), 64, 64);
315 break;
316 case Type::VectorTyID:
317 return GetDebugVectorType(pTy);
318 break;
319 case Type::FunctionTyID:
320 return GetDebugFunctionType(pTy);
321 break;
322 default:
323 SWR_ASSERT(false, "Unimplemented llvm type");
324 }
325 return nullptr;
326 }
327
328 // Create a DISubroutineType from an llvm FunctionType
329 DIType* JitManager::GetDebugFunctionType(Type* pTy)
330 {
331 SmallVector<Metadata*, 8> ElemTypes;
332 FunctionType* pFuncTy = cast<FunctionType>(pTy);
333 DIBuilder builder(*mpCurrentModule);
334
335 // Add result type
336 ElemTypes.push_back(GetDebugType(pFuncTy->getReturnType()));
337
338 // Add arguments
339 for (auto& param : pFuncTy->params())
340 {
341 ElemTypes.push_back(GetDebugType(param));
342 }
343
344 return builder.createSubroutineType(builder.getOrCreateTypeArray(ElemTypes));
345 }
346
347 DIType* JitManager::GetDebugIntegerType(Type* pTy)
348 {
349 DIBuilder builder(*mpCurrentModule);
350 IntegerType* pIntTy = cast<IntegerType>(pTy);
351 switch (pIntTy->getBitWidth())
352 {
353 case 1:
354 return builder.createBasicType("int1", 1, dwarf::DW_ATE_unsigned);
355 break;
356 case 8:
357 return builder.createBasicType("int8", 8, dwarf::DW_ATE_signed);
358 break;
359 case 16:
360 return builder.createBasicType("int16", 16, dwarf::DW_ATE_signed);
361 break;
362 case 32:
363 return builder.createBasicType("int", 32, dwarf::DW_ATE_signed);
364 break;
365 case 64:
366 return builder.createBasicType("int64", 64, dwarf::DW_ATE_signed);
367 break;
368 case 128:
369 return builder.createBasicType("int128", 128, dwarf::DW_ATE_signed);
370 break;
371 default:
372 SWR_ASSERT(false, "Unimplemented integer bit width");
373 }
374 return nullptr;
375 }
376
377 DIType* JitManager::GetDebugVectorType(Type* pTy)
378 {
379 DIBuilder builder(*mpCurrentModule);
380 VectorType* pVecTy = cast<VectorType>(pTy);
381 DataLayout DL = DataLayout(mpCurrentModule);
382 uint32_t size = DL.getTypeAllocSizeInBits(pVecTy);
383 uint32_t alignment = DL.getABITypeAlignment(pVecTy);
384 SmallVector<Metadata*, 1> Elems;
385 Elems.push_back(builder.getOrCreateSubrange(0, pVecTy->getVectorNumElements()));
386
387 return builder.createVectorType(size,
388 alignment,
389 GetDebugType(pVecTy->getVectorElementType()),
390 builder.getOrCreateArray(Elems));
391 }
392
393 //////////////////////////////////////////////////////////////////////////
394 /// @brief Dump function x86 assembly to file.
395 /// @note This should only be called after the module has been jitted to x86 and the
396 /// module will not be further accessed.
397 void JitManager::DumpAsm(Function* pFunction, const char* fileName)
398 {
399 if (KNOB_DUMP_SHADER_IR)
400 {
401 #if defined(_WIN32)
402 DWORD pid = GetCurrentProcessId();
403 char procname[MAX_PATH];
404 GetModuleFileNameA(NULL, procname, MAX_PATH);
405 const char* pBaseName = strrchr(procname, '\\');
406 std::stringstream outDir;
407 outDir << JITTER_OUTPUT_DIR << pBaseName << "_" << pid << std::ends;
408 CreateDirectoryPath(outDir.str().c_str());
409 #endif
410
411 std::error_code EC;
412 Module* pModule = pFunction->getParent();
413 const char* funcName = pFunction->getName().data();
414 char fName[256];
415 #if defined(_WIN32)
416 sprintf(fName, "%s\\%s.%s.asm", outDir.str().c_str(), funcName, fileName);
417 #else
418 sprintf(fName, "%s.%s.asm", funcName, fileName);
419 #endif
420
421 raw_fd_ostream filestream(fName, EC, llvm::sys::fs::F_None);
422
423 legacy::PassManager* pMPasses = new legacy::PassManager();
424 auto* pTarget = mpExec->getTargetMachine();
425 pTarget->Options.MCOptions.AsmVerbose = true;
426 #if LLVM_VERSION_MAJOR >= 7
427 pTarget->addPassesToEmitFile(
428 *pMPasses, filestream, nullptr, TargetMachine::CGFT_AssemblyFile);
429 #else
430 pTarget->addPassesToEmitFile(*pMPasses, filestream, TargetMachine::CGFT_AssemblyFile);
431 #endif
432 pMPasses->run(*pModule);
433 delete pMPasses;
434 pTarget->Options.MCOptions.AsmVerbose = false;
435 }
436 }
437
438 std::string JitManager::GetOutputDir()
439 {
440 #if defined(_WIN32)
441 DWORD pid = GetCurrentProcessId();
442 char procname[MAX_PATH];
443 GetModuleFileNameA(NULL, procname, MAX_PATH);
444 const char* pBaseName = strrchr(procname, '\\');
445 std::stringstream outDir;
446 outDir << JITTER_OUTPUT_DIR << pBaseName << "_" << pid;
447 CreateDirectoryPath(outDir.str().c_str());
448 return outDir.str();
449 #endif
450 return "";
451 }
452
453 //////////////////////////////////////////////////////////////////////////
454 /// @brief Dump function to file.
455 void JitManager::DumpToFile(Module* M,
456 const char* fileName,
457 llvm::AssemblyAnnotationWriter* annotater)
458 {
459 if (KNOB_DUMP_SHADER_IR)
460 {
461 std::string outDir = GetOutputDir();
462
463 std::error_code EC;
464 const char* funcName = M->getName().data();
465 char fName[256];
466 #if defined(_WIN32)
467 sprintf(fName, "%s\\%s.%s.ll", outDir.c_str(), funcName, fileName);
468 #else
469 sprintf(fName, "%s.%s.ll", funcName, fileName);
470 #endif
471 raw_fd_ostream fd(fName, EC, llvm::sys::fs::F_None);
472 M->print(fd, annotater);
473 fd.flush();
474 }
475 }
476
477 //////////////////////////////////////////////////////////////////////////
478 /// @brief Dump function to file.
479 void JitManager::DumpToFile(Function* f, const char* fileName)
480 {
481 if (KNOB_DUMP_SHADER_IR)
482 {
483 std::string outDir = GetOutputDir();
484
485 std::error_code EC;
486 const char* funcName = f->getName().data();
487 char fName[256];
488 #if defined(_WIN32)
489 sprintf(fName, "%s\\%s.%s.ll", outDir.c_str(), funcName, fileName);
490 #else
491 sprintf(fName, "%s.%s.ll", funcName, fileName);
492 #endif
493 raw_fd_ostream fd(fName, EC, llvm::sys::fs::F_None);
494 f->print(fd, nullptr);
495
496 #if defined(_WIN32)
497 sprintf(fName, "%s\\cfg.%s.%s.dot", outDir.c_str(), funcName, fileName);
498 #else
499 sprintf(fName, "cfg.%s.%s.dot", funcName, fileName);
500 #endif
501 fd.flush();
502
503 raw_fd_ostream fd_cfg(fName, EC, llvm::sys::fs::F_Text);
504 WriteGraph(fd_cfg, (const Function*)f);
505
506 fd_cfg.flush();
507 }
508 }
509
510 extern "C" {
511 bool g_DllActive = true;
512
513 //////////////////////////////////////////////////////////////////////////
514 /// @brief Create JIT context.
515 /// @param simdWidth - SIMD width to be used in generated program.
516 HANDLE JITCALL JitCreateContext(uint32_t targetSimdWidth, const char* arch, const char* core)
517 {
518 return new JitManager(targetSimdWidth, arch, core);
519 }
520
521 //////////////////////////////////////////////////////////////////////////
522 /// @brief Destroy JIT context.
523 void JITCALL JitDestroyContext(HANDLE hJitContext)
524 {
525 if (g_DllActive)
526 {
527 delete reinterpret_cast<JitManager*>(hJitContext);
528 }
529 }
530 }
531
532 //////////////////////////////////////////////////////////////////////////
533 /// JitCache
534 //////////////////////////////////////////////////////////////////////////
535
536 //////////////////////////////////////////////////////////////////////////
537 /// JitCacheFileHeader
538 //////////////////////////////////////////////////////////////////////////
539 struct JitCacheFileHeader
540 {
541 void Init(uint32_t llCRC,
542 uint32_t objCRC,
543 const std::string& moduleID,
544 const std::string& cpu,
545 uint32_t optLevel,
546 uint64_t objSize)
547 {
548 m_objSize = objSize;
549 m_llCRC = llCRC;
550 m_objCRC = objCRC;
551 strncpy(m_ModuleID, moduleID.c_str(), JC_STR_MAX_LEN - 1);
552 m_ModuleID[JC_STR_MAX_LEN - 1] = 0;
553 strncpy(m_Cpu, cpu.c_str(), JC_STR_MAX_LEN - 1);
554 m_Cpu[JC_STR_MAX_LEN - 1] = 0;
555 m_optLevel = optLevel;
556 }
557
558
559 bool
560 IsValid(uint32_t llCRC, const std::string& moduleID, const std::string& cpu, uint32_t optLevel)
561 {
562 if ((m_MagicNumber != JC_MAGIC_NUMBER) || (m_llCRC != llCRC) ||
563 (m_platformKey != JC_PLATFORM_KEY) || (m_optLevel != optLevel))
564 {
565 return false;
566 }
567
568 m_ModuleID[JC_STR_MAX_LEN - 1] = 0;
569 if (strncmp(moduleID.c_str(), m_ModuleID, JC_STR_MAX_LEN - 1))
570 {
571 return false;
572 }
573
574 m_Cpu[JC_STR_MAX_LEN - 1] = 0;
575 if (strncmp(cpu.c_str(), m_Cpu, JC_STR_MAX_LEN - 1))
576 {
577 return false;
578 }
579
580 return true;
581 }
582
583 uint64_t GetObjectSize() const { return m_objSize; }
584 uint64_t GetObjectCRC() const { return m_objCRC; }
585
586 private:
587 static const uint64_t JC_MAGIC_NUMBER = 0xfedcba9876543210ULL + 7;
588 static const size_t JC_STR_MAX_LEN = 32;
589 static const uint32_t JC_PLATFORM_KEY = (LLVM_VERSION_MAJOR << 24) |
590 (LLVM_VERSION_MINOR << 16) | (LLVM_VERSION_PATCH << 8) |
591 ((sizeof(void*) > sizeof(uint32_t)) ? 1 : 0);
592
593 uint64_t m_MagicNumber = JC_MAGIC_NUMBER;
594 uint64_t m_objSize = 0;
595 uint32_t m_llCRC = 0;
596 uint32_t m_platformKey = JC_PLATFORM_KEY;
597 uint32_t m_objCRC = 0;
598 uint32_t m_optLevel = 0;
599 char m_ModuleID[JC_STR_MAX_LEN] = {};
600 char m_Cpu[JC_STR_MAX_LEN] = {};
601 };
602
603 static inline uint32_t ComputeModuleCRC(const llvm::Module* M)
604 {
605 std::string bitcodeBuffer;
606 raw_string_ostream bitcodeStream(bitcodeBuffer);
607
608 #if LLVM_VERSION_MAJOR >= 7
609 llvm::WriteBitcodeToFile(*M, bitcodeStream);
610 #else
611 llvm::WriteBitcodeToFile(M, bitcodeStream);
612 #endif
613 // M->print(bitcodeStream, nullptr, false);
614
615 bitcodeStream.flush();
616
617 return ComputeCRC(0, bitcodeBuffer.data(), bitcodeBuffer.size());
618 }
619
620 /// constructor
621 JitCache::JitCache()
622 {
623 #if defined(__APPLE__) || defined(FORCE_LINUX) || defined(__linux__) || defined(__gnu_linux__)
624 if (strncmp(KNOB_JIT_CACHE_DIR.c_str(), "~/", 2) == 0)
625 {
626 char* homedir;
627 if (!(homedir = getenv("HOME")))
628 {
629 homedir = getpwuid(getuid())->pw_dir;
630 }
631 mCacheDir = homedir;
632 mCacheDir += (KNOB_JIT_CACHE_DIR.c_str() + 1);
633 }
634 else
635 #endif
636 {
637 mCacheDir = KNOB_JIT_CACHE_DIR;
638 }
639
640 // Create cache dir at startup to allow jitter to write debug.ll files
641 // to that directory.
642 if (!llvm::sys::fs::exists(mCacheDir.str()) &&
643 llvm::sys::fs::create_directories(mCacheDir.str()))
644 {
645 SWR_INVALID("Unable to create directory: %s", mCacheDir.c_str());
646 }
647
648 }
649
650 int ExecUnhookedProcess(const std::string& CmdLine, std::string* pStdOut, std::string* pStdErr)
651 {
652 return ExecCmd(CmdLine, "", pStdOut, pStdErr);
653 }
654
655 /// Calculate actual directory where module will be cached.
656 /// This is always a subdirectory of mCacheDir. Full absolute
657 /// path name will be stored in mCurrentModuleCacheDir
658 void JitCache::CalcModuleCacheDir()
659 {
660 mModuleCacheDir.clear();
661
662 llvm::SmallString<MAX_PATH> moduleDir = mCacheDir;
663
664 // Create 4 levels of directory hierarchy based on CRC, 256 entries each
665 uint8_t* pCRC = (uint8_t*)&mCurrentModuleCRC;
666 for (uint32_t i = 0; i < 4; ++i)
667 {
668 llvm::sys::path::append(moduleDir, std::to_string((int)pCRC[i]));
669 }
670
671 mModuleCacheDir = moduleDir;
672 }
673
674 /// notifyObjectCompiled - Provides a pointer to compiled code for Module M.
675 void JitCache::notifyObjectCompiled(const llvm::Module* M, llvm::MemoryBufferRef Obj)
676 {
677 const std::string& moduleID = M->getModuleIdentifier();
678 if (!moduleID.length())
679 {
680 return;
681 }
682
683 if (!mModuleCacheDir.size())
684 {
685 SWR_INVALID("Unset module cache directory");
686 return;
687 }
688
689 if (!llvm::sys::fs::exists(mModuleCacheDir.str()) &&
690 llvm::sys::fs::create_directories(mModuleCacheDir.str()))
691 {
692 SWR_INVALID("Unable to create directory: %s", mModuleCacheDir.c_str());
693 return;
694 }
695
696 JitCacheFileHeader header;
697
698 llvm::SmallString<MAX_PATH> filePath = mModuleCacheDir;
699 llvm::sys::path::append(filePath, moduleID);
700
701 llvm::SmallString<MAX_PATH> objPath = filePath;
702 objPath += JIT_OBJ_EXT;
703
704 {
705 std::error_code err;
706 llvm::raw_fd_ostream fileObj(objPath.c_str(), err, llvm::sys::fs::F_None);
707 fileObj << Obj.getBuffer();
708 fileObj.flush();
709 }
710
711
712 {
713 std::error_code err;
714 llvm::raw_fd_ostream fileObj(filePath.c_str(), err, llvm::sys::fs::F_None);
715
716 uint32_t objcrc = ComputeCRC(0, Obj.getBufferStart(), Obj.getBufferSize());
717
718 header.Init(mCurrentModuleCRC, objcrc, moduleID, mCpu, mOptLevel, Obj.getBufferSize());
719
720 fileObj.write((const char*)&header, sizeof(header));
721 fileObj.flush();
722 }
723 }
724
725 /// Returns a pointer to a newly allocated MemoryBuffer that contains the
726 /// object which corresponds with Module M, or 0 if an object is not
727 /// available.
728 std::unique_ptr<llvm::MemoryBuffer> JitCache::getObject(const llvm::Module* M)
729 {
730 const std::string& moduleID = M->getModuleIdentifier();
731 mCurrentModuleCRC = ComputeModuleCRC(M);
732
733 if (!moduleID.length())
734 {
735 return nullptr;
736 }
737
738 CalcModuleCacheDir();
739
740 if (!llvm::sys::fs::exists(mModuleCacheDir))
741 {
742 return nullptr;
743 }
744
745 llvm::SmallString<MAX_PATH> filePath = mModuleCacheDir;
746 llvm::sys::path::append(filePath, moduleID);
747
748 llvm::SmallString<MAX_PATH> objFilePath = filePath;
749 objFilePath += JIT_OBJ_EXT;
750
751 FILE* fpObjIn = nullptr;
752 FILE* fpIn = fopen(filePath.c_str(), "rb");
753 if (!fpIn)
754 {
755 return nullptr;
756 }
757
758 std::unique_ptr<llvm::MemoryBuffer> pBuf = nullptr;
759 do
760 {
761 JitCacheFileHeader header;
762 if (!fread(&header, sizeof(header), 1, fpIn))
763 {
764 break;
765 }
766
767 if (!header.IsValid(mCurrentModuleCRC, moduleID, mCpu, mOptLevel))
768 {
769 break;
770 }
771
772 fpObjIn = fopen(objFilePath.c_str(), "rb");
773 if (!fpObjIn)
774 {
775 break;
776 }
777
778 #if LLVM_VERSION_MAJOR < 6
779 pBuf = llvm::MemoryBuffer::getNewUninitMemBuffer(size_t(header.GetObjectSize()));
780 #else
781 pBuf = llvm::WritableMemoryBuffer::getNewUninitMemBuffer(size_t(header.GetObjectSize()));
782 #endif
783 if (!fread(const_cast<char*>(pBuf->getBufferStart()), header.GetObjectSize(), 1, fpObjIn))
784 {
785 pBuf = nullptr;
786 break;
787 }
788
789 if (header.GetObjectCRC() != ComputeCRC(0, pBuf->getBufferStart(), pBuf->getBufferSize()))
790 {
791 SWR_TRACE("Invalid object cache file, ignoring: %s", filePath.c_str());
792 pBuf = nullptr;
793 break;
794 }
795
796 } while (0);
797
798 fclose(fpIn);
799
800 if (fpObjIn)
801 {
802 fclose(fpObjIn);
803 }
804
805
806 return pBuf;
807 }
808
809 void InterleaveAssemblyAnnotater::emitInstructionAnnot(const llvm::Instruction* pInst,
810 llvm::formatted_raw_ostream& OS)
811 {
812 auto dbgLoc = pInst->getDebugLoc();
813 if (dbgLoc)
814 {
815 unsigned int line = dbgLoc.getLine();
816 if (line != mCurrentLineNo)
817 {
818 if (line > 0 && line <= mAssembly.size())
819 {
820 // HACK: here we assume that OS is a formatted_raw_ostream(ods())
821 // and modify the color accordingly. We can't do the color
822 // modification on OS because formatted_raw_ostream strips
823 // the color information. The only way to fix this behavior
824 // is to patch LLVM.
825 OS << "\n; " << line << ": " << mAssembly[line - 1] << "\n";
826 }
827 mCurrentLineNo = line;
828 }
829 }
830 }