Proteus
Programmable JIT compilation and optimization for C/C++ using LLVM
Loading...
Searching...
No Matches
JitEngineDeviceCUDA.hpp
Go to the documentation of this file.
1//===-- JitEngineDeviceCUDA.hpp -- JIT Engine Device for CUDA header --===//
2//
3// Part of the Proteus Project, under the Apache License v2.0 with LLVM
4// Exceptions. See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8//
9//===----------------------------------------------------------------------===//
10
11#ifndef PROTEUS_JITENGINEDEVICECUDA_HPP
12#define PROTEUS_JITENGINEDEVICECUDA_HPP
13
15#include "proteus/Utils.h"
16#include <llvm/ADT/DenseMap.h>
17#include <llvm/ADT/SmallVector.h>
18#include <memory>
19
20namespace proteus {
21
22using namespace llvm;
23
25template <> struct DeviceTraits<JitEngineDeviceCUDA> {
26 using DeviceError_t = cudaError_t;
27 using DeviceStream_t = CUstream;
28 using KernelFunction_t = CUfunction;
29};
30
31class JitEngineDeviceCUDA : public JitEngineDevice<JitEngineDeviceCUDA> {
32public:
34
35 void *resolveDeviceGlobalAddr(const void *Addr);
36
37 void setLaunchBoundsForKernel(Module &M, Function &F, size_t GridSize,
38 int BlockSize);
39
40 void extractModules(BinaryInfo &BinInfo);
41
42 std::unique_ptr<Module> tryExtractKernelModule(BinaryInfo &BinInfo,
43 StringRef KernelName,
44 LLVMContext &Ctx);
45
46 void codegenPTX(Module &M, StringRef DeviceArch,
47 SmallVectorImpl<char> &PTXStr);
48
49 CUfunction getKernelFunctionFromImage(StringRef KernelName,
50 const void *Image);
51
52 cudaError_t launchKernelFunction(CUfunction KernelFunc, dim3 GridDim,
53 dim3 BlockDim, void **KernelArgs,
54 uint64_t ShmemSize, CUstream Stream);
55
57
58 std::unique_ptr<MemoryBuffer> compileOnly(Module &M);
59
60private:
64
65 void extractLinkedBitcode(LLVMContext &Ctx, CUmodule &CUMod,
66 SmallVector<std::unique_ptr<Module>> &LinkedModules,
67 std::string &ModuleId);
68};
69
70} // namespace proteus
71
72#endif
void const char * ModuleId
Definition CompilerInterfaceDevice.cpp:31
void char * KernelName
Definition CompilerInterfaceDevice.cpp:50
Definition JitEngineDevice.hpp:79
Definition Hashing.hpp:20
Definition JitEngineDeviceCUDA.hpp:31
std::unique_ptr< MemoryBuffer > compileOnly(Module &M)
Definition JitEngineDeviceCUDA.cpp:182
static JitEngineDeviceCUDA & instance()
Definition JitEngineDeviceCUDA.cpp:27
void setLaunchBoundsForKernel(Module &M, Function &F, size_t GridSize, int BlockSize)
void extractModules(BinaryInfo &BinInfo)
Definition JitEngineDeviceCUDA.cpp:114
void codegenPTX(Module &M, StringRef DeviceArch, SmallVectorImpl< char > &PTXStr)
HashT getModuleHash(BinaryInfo &BinInfo)
Definition JitEngineDeviceCUDA.cpp:69
std::unique_ptr< Module > tryExtractKernelModule(BinaryInfo &BinInfo, StringRef KernelName, LLVMContext &Ctx)
Definition JitEngineDeviceCUDA.cpp:106
void * resolveDeviceGlobalAddr(const void *Addr)
Definition JitEngineDeviceCUDA.cpp:23
cudaError_t launchKernelFunction(CUfunction KernelFunc, dim3 GridDim, dim3 BlockDim, void **KernelArgs, uint64_t ShmemSize, CUstream Stream)
Definition JitEngineDeviceCUDA.cpp:147
CUfunction getKernelFunctionFromImage(StringRef KernelName, const void *Image)
Definition JitEngineDeviceCUDA.cpp:139
Definition JitEngineDevice.hpp:245
std::string DeviceArch
Definition JitEngineDevice.hpp:525
Definition Helpers.h:76
Definition CppJitModule.cpp:21
CUfunction KernelFunction_t
Definition JitEngineDeviceCUDA.hpp:28
CUstream DeviceStream_t
Definition JitEngineDeviceCUDA.hpp:27
cudaError_t DeviceError_t
Definition JitEngineDeviceCUDA.hpp:26
Definition JitEngineDevice.hpp:243