mxnet
|
#include "mxnet/base.h"
#include "mxnet/op_attr_types.h"
#include <cuda.h>
#include <cuda_runtime_api.h>
#include <mutex>
#include <string>
#include <vector>
Go to the source code of this file.
Namespaces | |
mxnet | |
namespace of mxnet | |
mxnet::common | |
mxnet::common::cuda | |
common utils for cuda | |
mxnet::common::cuda::rtc | |
mxnet::common::cuda::rtc::util | |
Functions | |
std::string | mxnet::common::cuda::rtc::util::to_string (OpReqType req) |
Convert OpReqType to string. More... | |
int | mxnet::common::cuda::rtc::GetMaxSupportedArch () |
CUfunction | mxnet::common::cuda::rtc::get_function (const std::string &parameters, const std::string &kernel_name, const std::string &code, int dev_id) |
Compile and get the GPU kernel. Uses cache in order to eliminate the overhead of compilation. More... | |
void | mxnet::common::cuda::rtc::launch (CUfunction function, const dim3 grid_dim, const dim3 block_dim, unsigned int shared_mem_bytes, mshadow::Stream< gpu > *stream, std::vector< const void * > *args) |
Launch a GPU kernel. More... | |
Variables | |
std::mutex | mxnet::common::cuda::rtc::lock |