24 #include <dlpack/dlpack.h>
31 const std::string& TCDefinition,
32 const std::vector<const DLTensor*>& inputsInfo);
35 const std::vector<const DLTensor*>& inputsInfo);
68 const std::vector<const DLTensor*>& inputs,
69 const std::vector<DLTensor*>& outputs,
70 bool profile =
false)
const;
78 const std::vector<const void*>& inputs,
79 const std::vector<void*>& outputs)
const;
130 const std::vector<const DLTensor*>& inputsInfo)
const;
Block block() const
Definition: tc_executor.h:122
std::string getCudaSource()
Definition: tc_executor.h:81
std::shared_ptr< CudaRTCFunction > rtcFun
Definition: tc_executor.h:115
Specializing CudaDim to differentiate between Block and Grid sizes.
Definition: mapping_options.h:208
TcExecutor(const std::string &TCDefinition, const std::vector< const DLTensor * > &inputsInfo)
std::unique_ptr< tc::MappingOptions > options
Definition: tc_executor.h:111
std::string kernelSpecializedName
Definition: tc_executor.h:110
std::vector< dlutils::DLTensorUPtr > inputsInfo
Definition: tc_executor.h:107
Definition: tc2halide.h:29
std::vector< const DLTensor * > inferOutputTensorInfo()
void uncheckedRun(const std::vector< const void * > &inputs, const std::vector< void * > &outputs) const
isl::ctx ctx_
Definition: tc_executor.h:134
std::vector< int > kernelParams
Definition: tc_executor.h:109
void compileWithTcMapper()
void clearRTC()
Definition: tc_executor.h:91
lang::TreeRef tcTree_
Definition: tc_executor.h:133
void compile(const tc::MappingOptions &options)
std::vector< dlutils::DLTensorUPtr > outputsInfo
Definition: tc_executor.h:108
std::string kernelName
Definition: tc_executor.h:106
std::string cudaSource
Definition: tc_executor.h:112
Definition: mapping_options.h:336
std::chrono::high_resolution_clock::duration Duration
Definition: rtc.h:31
bool hasRTCFun()
Definition: tc_executor.h:85
void checkInputsCompliant(const std::vector< const DLTensor * > &inputsInfo) const
Duration run(const std::vector< const DLTensor * > &inputs, const std::vector< DLTensor * > &outputs, bool profile=false) const
static const size_t InvalidHandle
Definition: tc_executor.h:126
tc2halide::HalideComponents halideComponents_
Definition: tc_executor.h:131
TcExecutionInfo execInfo_
Definition: tc_executor.h:132
TcExecutor & operator=(TcExecutor &&)=delete
Block block
Definition: tc_executor.h:114
Specializing CudaDim to differentiate between Block and Grid sizes.
Definition: mapping_options.h:196
Grid grid() const
Definition: tc_executor.h:119
std::string kernelName() const
Definition: tc_executor.h:98
Grid grid
Definition: tc_executor.h:113
std::shared_ptr< Tree > TreeRef
Definition: tree.h:44
Definition: tc_executor.h:105
Definition: tc_executor.h:28