11#ifndef PROTEUS_JITENGINEDEVICECUDA_HPP
12#define PROTEUS_JITENGINEDEVICECUDA_HPP
16#include <llvm/ADT/DenseMap.h>
17#include <llvm/ADT/SmallVector.h>
24class JitEngineDeviceCUDA;
43 SmallVectorImpl<char> &PTXStr);
51 dim3 BlockDim,
void **KernelArgs,
52 uint64_t ShmemSize, CUstream Stream);
61 void extractLinkedBitcode(LLVMContext &Ctx, CUmodule &CUMod,
62 SmallVector<std::unique_ptr<Module>> &LinkedModules,
void const char * ModuleId
Definition CompilerInterfaceDevice.cpp:31
void char * KernelName
Definition CompilerInterfaceDevice.cpp:50
Definition JitEngineDevice.hpp:78
Definition Hashing.hpp:19
Definition JitEngineDeviceCUDA.hpp:31
std::unique_ptr< Module > extractModule(BinaryInfo &BinInfo)
Definition JitEngineDeviceCUDA.cpp:98
static JitEngineDeviceCUDA & instance()
Definition JitEngineDeviceCUDA.cpp:27
void codegenPTX(Module &M, StringRef DeviceArch, SmallVectorImpl< char > &PTXStr)
std::unique_ptr< MemoryBuffer > codegenObject(Module &M, StringRef DeviceArch)
Definition JitEngineDeviceCUDA.cpp:145
void setLaunchBoundsForKernel(Module &M, Function &F, size_t GridSize, int BlockSize)
Definition JitEngineDeviceCUDA.cpp:123
HashT getModuleHash(BinaryInfo &BinInfo)
Definition JitEngineDeviceCUDA.cpp:61
void * resolveDeviceGlobalAddr(const void *Addr)
Definition JitEngineDeviceCUDA.cpp:23
cudaError_t launchKernelFunction(CUfunction KernelFunc, dim3 GridDim, dim3 BlockDim, void **KernelArgs, uint64_t ShmemSize, CUstream Stream)
Definition JitEngineDeviceCUDA.cpp:137
CUfunction getKernelFunctionFromImage(StringRef KernelName, const void *Image)
Definition JitEngineDeviceCUDA.cpp:129
Definition JitEngineDevice.hpp:176
std::string DeviceArch
Definition JitEngineDevice.hpp:385
Definition JitEngine.cpp:20
CUfunction KernelFunction_t
Definition JitEngineDeviceCUDA.hpp:28
CUstream DeviceStream_t
Definition JitEngineDeviceCUDA.hpp:27
cudaError_t DeviceError_t
Definition JitEngineDeviceCUDA.hpp:26
Definition JitEngineDevice.hpp:174