Tensor Comprehensions
|
Namespaces | |
detail | |
Classes | |
class | GeneticAutotunerATen |
class | GeneticSearch |
class | BoolParameter |
class | RangeParameter |
class | ParameterView |
class | SchedulerOptionsParameters |
class | MultiRangeParams |
class | TilingParameters |
class | CudaDimParameters |
class | TuningConfiguration |
class | TuningParameterFixer |
class | CandidateConfiguration |
class | ConcurrentQueue |
class | Printer |
struct | OptionsWithMedianTime |
Typedefs | |
using | TimePoint = std::chrono::high_resolution_clock::time_point |
using | Duration = std::chrono::high_resolution_clock::duration |
Functions | |
template<typename Vector , typename... Vectors> | |
Vector | mergeVectors (Vector &&v, Vectors &&...vs) |
std::vector< std::size_t > | powers2andCeilDivisors (std::size_t val) |
std::vector < OptionsWithMedianTime > | getOptionsAndMedianRuntimes (const std::string &id, const std::vector< const DLTensor * > &inputs) |
std::vector< MappingOptions > | restoreCandidates (const std::string &id, const std::vector< const DLTensor * > &inputs, const std::vector< const DLTensor * > &outputs) |
llvm::Optional< MappingOptions > | getBestOptions (const std::string &id, const std::vector< const DLTensor * > &inputs, const std::vector< const DLTensor * > &outputs) |
using tc::autotune::Duration = std::chrono::high_resolution_clock::duration
using tc::autotune::TimePoint = std::chrono::high_resolution_clock::time_point
llvm::Optional<MappingOptions> tc::autotune::getBestOptions | ( | const std::string & | id, |
const std::vector< const DLTensor * > & | inputs, | ||
const std::vector< const DLTensor * > & | outputs | ||
) |
std::vector<OptionsWithMedianTime> tc::autotune::getOptionsAndMedianRuntimes | ( | const std::string & | id, |
const std::vector< const DLTensor * > & | inputs | ||
) |
Vector tc::autotune::mergeVectors | ( | Vector && | v, |
Vectors &&... | vs | ||
) |
std::vector<std::size_t> tc::autotune::powers2andCeilDivisors | ( | std::size_t | val | ) |
Returns all the powers of 2 up to and including the first one that is larger than val, together with the result of ceil(val/pow2) for each of those powers of 2 (except for the one that is larger than val).
std::vector<MappingOptions> tc::autotune::restoreCandidates | ( | const std::string & | id, |
const std::vector< const DLTensor * > & | inputs, | ||
const std::vector< const DLTensor * > & | outputs | ||
) |