mxnet
|
Classes | |
struct | dnnl_version_t |
Macros | |
#define | DNNL_RUNTIME_NONE 0u |
No runtime (disabled) More... | |
#define | DNNL_RUNTIME_SEQ 1u |
Sequential runtime (CPU only) More... | |
#define | DNNL_RUNTIME_OMP 2u |
OpenMP runtime (CPU only) More... | |
#define | DNNL_RUNTIME_TBB 4u |
TBB runtime (CPU only) More... | |
#define | DNNL_RUNTIME_THREADPOOL 8u |
Threadpool runtime (CPU only) More... | |
#define | DNNL_RUNTIME_OCL 256u |
OpenCL runtime. More... | |
#define | DNNL_RUNTIME_SYCL 512u |
SYCL runtime. More... | |
#define | DNNL_RUNTIME_DPCPP DNNL_RUNTIME_SYCL |
DPC++ runtime. More... | |
#define | DNNL_JIT_PROFILE_NONE 0u |
Disable profiling completely. More... | |
#define | DNNL_JIT_PROFILE_VTUNE 1u |
Enable VTune Amplifier integration. More... | |
#define | DNNL_JIT_PROFILE_LINUX_PERFMAP 2u |
Enable Linux perf integration via perfmap files. More... | |
#define | DNNL_JIT_PROFILE_LINUX_JITDUMP 4u |
Enable Linux perf integration via jitdump files. More... | |
#define | DNNL_JIT_PROFILE_LINUX_JITDUMP_USE_TSC 8u |
Instruct Linux perf integration via jitdump files to use TSC. More... | |
#define | DNNL_JIT_PROFILE_LINUX_PERF (DNNL_JIT_PROFILE_LINUX_JITDUMP | DNNL_JIT_PROFILE_LINUX_PERFMAP) |
Enable Linux perf integration (both jitdump and perfmap) More... | |
Enumerations | |
enum | dnnl_cpu_isa_t { dnnl_cpu_isa_all = 0x0, dnnl_cpu_isa_sse41 = 0x1, dnnl_cpu_isa_avx = 0x3, dnnl_cpu_isa_avx2 = 0x7, dnnl_cpu_isa_avx512_mic = 0xf, dnnl_cpu_isa_avx512_mic_4ops = 0x1f, dnnl_cpu_isa_avx512_core = 0x27, dnnl_cpu_isa_avx512_core_vnni = 0x67, dnnl_cpu_isa_avx512_core_bf16 = 0xe7, dnnl_cpu_isa_avx512_core_amx = 0x3e7, dnnl_cpu_isa_avx2_vnni = 0x407 } |
CPU instruction set flags. More... | |
enum | dnnl_cpu_isa_hints_t { dnnl_cpu_isa_no_hints = 0x0, dnnl_cpu_isa_prefer_ymm = 0x1 } |
CPU ISA hints flags. More... | |
Functions | |
dnnl_status_t DNNL_API | dnnl_set_verbose (int level) |
dnnl_status_t DNNL_API | dnnl_set_jit_dump (int enable) |
const dnnl_version_t DNNL_API * | dnnl_version (void) |
dnnl_status_t DNNL_API | dnnl_set_jit_profiling_flags (unsigned flags) |
dnnl_status_t DNNL_API | dnnl_set_jit_profiling_jitdumpdir (const char *dir) |
dnnl_status_t DNNL_API | dnnl_set_max_cpu_isa (dnnl_cpu_isa_t isa) |
dnnl_cpu_isa_t DNNL_API | dnnl_get_effective_cpu_isa (void) |
dnnl_status_t DNNL_API | dnnl_set_cpu_isa_hints (dnnl_cpu_isa_hints_t isa_hints) |
dnnl_cpu_isa_hints_t DNNL_API | dnnl_get_cpu_isa_hints (void) |
#define DNNL_JIT_PROFILE_LINUX_JITDUMP 4u |
Enable Linux perf integration via jitdump files.
#define DNNL_JIT_PROFILE_LINUX_JITDUMP_USE_TSC 8u |
Instruct Linux perf integration via jitdump files to use TSC. DNNL_JIT_PROFILE_LINUX_JITDUMP must be set too for this to take effect.
#define DNNL_JIT_PROFILE_LINUX_PERF (DNNL_JIT_PROFILE_LINUX_JITDUMP | DNNL_JIT_PROFILE_LINUX_PERFMAP) |
Enable Linux perf integration (both jitdump and perfmap)
#define DNNL_JIT_PROFILE_LINUX_PERFMAP 2u |
Enable Linux perf integration via perfmap files.
#define DNNL_JIT_PROFILE_NONE 0u |
Disable profiling completely.
#define DNNL_JIT_PROFILE_VTUNE 1u |
Enable VTune Amplifier integration.
#define DNNL_RUNTIME_DPCPP DNNL_RUNTIME_SYCL |
DPC++ runtime.
#define DNNL_RUNTIME_NONE 0u |
No runtime (disabled)
#define DNNL_RUNTIME_OCL 256u |
OpenCL runtime.
#define DNNL_RUNTIME_OMP 2u |
OpenMP runtime (CPU only)
#define DNNL_RUNTIME_SEQ 1u |
Sequential runtime (CPU only)
#define DNNL_RUNTIME_SYCL 512u |
SYCL runtime.
#define DNNL_RUNTIME_TBB 4u |
TBB runtime (CPU only)
#define DNNL_RUNTIME_THREADPOOL 8u |
Threadpool runtime (CPU only)
enum dnnl_cpu_isa_hints_t |
CPU ISA hints flags.
enum dnnl_cpu_isa_t |
CPU instruction set flags.
dnnl_cpu_isa_hints_t DNNL_API dnnl_get_cpu_isa_hints | ( | void | ) |
Gets the ISA specific hints that library can follow. See dnnl_cpu_isa_hints_t and #dnnl::cpu_isa_hints for the list of the values returned by the C and C++ API functions respectively.
dnnl_cpu_isa_t DNNL_API dnnl_get_effective_cpu_isa | ( | void | ) |
Gets the maximal ISA the library can dispatch to on the CPU. See dnnl_cpu_isa_t and #dnnl::cpu_isa for the list of the values returned by the C and C++ API functions respectively.
dnnl_status_t DNNL_API dnnl_set_cpu_isa_hints | ( | dnnl_cpu_isa_hints_t | isa_hints | ) |
Sets the hints flag for the CPU ISA. See dnnl_cpu_isa_hints_t and #dnnl::cpu_isa_hints for the list of the values accepted by the C and C++ API functions respectively.
This function has effect only once, and returns an error on subsequent calls. It should also be invoked before any other oneDNN API call, otherwise it may return an error.
This function overrides the DNNL_CPU_ISA_HINTS environment variable.
isa_hints | CPU ISA hints to be passed over to the implementation. Pass dnnl_cpu_isa_no_hints/#dnnl::cpu_isa_hints::no_hints to use default features, i.e., no hints. |
dnnl_status_t DNNL_API dnnl_set_jit_dump | ( | int | enable | ) |
Configures dumping of JIT-generated code.
enable | Flag value. Set to 0 to disable and set to 1 to enable. |
Returns dnnl_invalid_arguments/#dnnl::status::invalid_arguments if the flag value is invalid, and dnnl_success/#dnnl::status::success on success.
dnnl_status_t DNNL_API dnnl_set_jit_profiling_flags | ( | unsigned | flags | )
Sets library profiling flags. The flags define which profilers are supported.
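flags | Profiling flags that can contain the following bits:
- DNNL_JIT_PROFILE_VTUNE -- VTune Amplifier integration
- DNNL_JIT_PROFILE_LINUX_JITDUMP -- Linux perf integration via jitdump files
- DNNL_JIT_PROFILE_LINUX_PERFMAP -- Linux perf integration via perfmap files
|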
Passing DNNL_JIT_PROFILE_NONE disables profiling completely.
Returns dnnl_invalid_arguments/#dnnl::status::invalid_arguments if the flags value is invalid, and dnnl_success/#dnnl::status::success on success.
dnnl_status_t DNNL_API dnnl_set_jit_profiling_jitdumpdir | ( | const char * | dir | )
Sets JIT dump output path. Only applicable to Linux and is only used when profiling flags have DNNL_JIT_PROFILE_LINUX_PERF bit set.
After the first JIT kernel is generated, the jitdump output will be placed into a temporary directory created using the mkdtemp template 'dir/.debug/jit/dnnl.XXXXXX'.
dir | JIT dump output path. |
dnnl_status_t DNNL_API dnnl_set_max_cpu_isa | ( | dnnl_cpu_isa_t | isa | ) |
Sets the maximal ISA the library can dispatch to on the CPU. See dnnl_cpu_isa_t and #dnnl::cpu_isa for the list of the values accepted by the C and C++ API functions respectively.
This function has effect only once, and returns an error on subsequent calls. It should also be invoked before any other oneDNN API call, otherwise it may return an error.
This function overrides the DNNL_MAX_CPU_ISA environment variable. The environment variable can be set to the desired maximal ISA name in upper case and with dnnl_cpu_isa prefix removed. For example: DNNL_MAX_CPU_ISA=AVX2.
isa | Maximal ISA the library should dispatch to. Pass dnnl_cpu_isa_all/#dnnl::cpu_isa::all to remove ISA restrictions (except for ISAs with initial support in the library). |
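Returns dnnl_success/#dnnl::status::success on success, and dnnl_invalid_arguments/#dnnl::status::invalid_arguments if the isa parameter is invalid or the ISA cannot be changed at this time.
dnnl_status_t DNNL_API dnnl_set_verbose | ( | int | level | )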
Configures verbose output to stdout.
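level | Verbosity level:
- 0: no verbose output (default)
- 1: primitive information at execution
- 2: primitive information at creation and execution
|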
Returns dnnl_invalid_arguments/#dnnl::status::invalid_arguments if the level value is invalid, and dnnl_success/#dnnl::status::success on success.
const dnnl_version_t DNNL_API* dnnl_version | ( | void | )
Returns library version information.