// docs/api/3rdparty_2mshadow_2mshadow_2base_8h_source.html

/*

 * Licensed to the Apache Software Foundation (ASF) under one

 * or more contributor license agreements.  See the NOTICE file

 * distributed with this work for additional information

 * regarding copyright ownership.  The ASF licenses this file

 * to you under the Apache License, Version 2.0 (the

 * "License"); you may not use this file except in compliance

 * with the License.  You may obtain a copy of the License at

 *

 *   http://www.apache.org/licenses/LICENSE-2.0

 *

 * Unless required by applicable law or agreed to in writing,

 * software distributed under the License is distributed on an

 * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY

 * KIND, either express or implied.  See the License for the

 * specific language governing permissions and limitations

 * under the License.

 */


#ifndef MSHADOW_BASE_H_

#define MSHADOW_BASE_H_

// MSVC-only setup. Each macro is defined only when the build has not already
// provided it: the two _CRT_SECURE_* macros and NOMINMAX (conventionally used
// to keep Windows headers from defining min/max macros).
#if defined(_MSC_VER)
#  if !defined(_CRT_SECURE_NO_WARNINGS)
#    define _CRT_SECURE_NO_WARNINGS
#  endif
#  if !defined(_CRT_SECURE_NO_DEPRECATE)
#    define _CRT_SECURE_NO_DEPRECATE
#  endif
#  if !defined(NOMINMAX)
#    define NOMINMAX
#  endif
#endif  // _MSC_VER

#include <algorithm>

#include <cfloat>

#include <climits>

#include <cmath>

#include <cstdio>

#include <functional>

#include <limits>

#include <sstream>

#include <string>


// Fixed-width integer names. Under MSVC they are declared here from the
// compiler's sized integer keywords; every other compiler takes them from
// <inttypes.h>.
#ifdef _MSC_VER

typedef signed char int8_t;

typedef __int16 int16_t;

typedef __int32 int32_t;

typedef __int64 int64_t;

typedef unsigned char uint8_t;

typedef unsigned __int16 uint16_t;

typedef unsigned __int32 uint32_t;

typedef unsigned __int64 uint64_t;

#else

#include <inttypes.h>

#endif

// macro definitions

// Build-configuration switches. Every macro below keeps a value supplied by
// the build and otherwise falls back to the default shown here.

// When non-zero, CBLAS, MKL and CUDA are all forced off (see the #if below).
#if !defined(MSHADOW_STAND_ALONE)
#define MSHADOW_STAND_ALONE 0
#endif

// NOTE(review): presumably toggles padded allocation - confirm at the use site.
#if !defined(MSHADOW_ALLOC_PAD)
#define MSHADOW_ALLOC_PAD true
#endif

// NOTE(review): presumably a size threshold related to MSHADOW_ALLOC_PAD -
// confirm at the use site.
#if !defined(MSHADOW_MIN_PAD_RATIO)
#define MSHADOW_MIN_PAD_RATIO 2
#endif

// Stand-alone builds define the three backend switches here, ahead of the
// defaults further down, so those defaults never apply.
#if MSHADOW_STAND_ALONE
#define MSHADOW_USE_CBLAS 0
#define MSHADOW_USE_MKL   0
#define MSHADOW_USE_CUDA  0
#endif

#if !defined(MSHADOW_FORCE_STREAM)
#define MSHADOW_FORCE_STREAM 1
#endif

// BLAS backend selection: CBLAS is off and MKL is on unless overridden.
#if !defined(MSHADOW_USE_CBLAS)
#define MSHADOW_USE_CBLAS 0
#endif

#if !defined(MSHADOW_USE_MKL)
#define MSHADOW_USE_MKL   1
#endif

// CUDA and its companion libraries.
#if !defined(MSHADOW_USE_CUDA)
#define MSHADOW_USE_CUDA   1
#endif

#if !defined(MSHADOW_USE_CUDNN)
#define MSHADOW_USE_CUDNN 0
#endif

#if !defined(MSHADOW_USE_CUTENSOR)
#define MSHADOW_USE_CUTENSOR 0
#endif

// cuSOLVER follows the CUDA switch by default.
#if !defined(MSHADOW_USE_CUSOLVER)
#define MSHADOW_USE_CUSOLVER MSHADOW_USE_CUDA
#endif

#if !defined(MSHADOW_OLD_CUDA)
#define MSHADOW_OLD_CUDA 0
#endif

#if !defined(MSHADOW_USE_SSE)
#define MSHADOW_USE_SSE 1
#endif


// MSHADOW_USE_F16C default, applied only when the build has not set it:
//   0 under MSVC or when compiling with __CUDACC__,
//   0 under clang older than 8.1,
//   1 everywhere else.
// The clang version test spans two physical lines; the backslash must be the
// last character before the newline and be followed directly by the
// continuation line, otherwise the #elif expression is cut in half.
#ifndef MSHADOW_USE_F16C
  #if defined(_MSC_VER) || defined(__CUDACC__)
    #define MSHADOW_USE_F16C 0
  #elif defined(__clang__) && \
        ((__clang_major__ < 8) || ((__clang_major__ == 8) && (__clang_minor__ < 1)))
    #define MSHADOW_USE_F16C 0
  #else
    #define MSHADOW_USE_F16C 1
  #endif
#endif


// NVML support is off unless the build enables it.
#if !defined(MSHADOW_USE_NVML)
#define MSHADOW_USE_NVML 0
#endif

// SSE conflicts with CUDA compilation (__CUDACC__), so it is switched off there

// Under __CUDACC__ any earlier MSHADOW_USE_SSE setting is discarded and the
// switch is pinned to 0.
#if defined(__CUDACC__)
#undef MSHADOW_USE_SSE
#define MSHADOW_USE_SSE 0
#endif


#if MSHADOW_USE_CBLAS

extern "C" {

    #include <cblas.h>

}

#elif MSHADOW_USE_MKL

  #if MSHADOW_INT64_TENSOR_SIZE == 1

    // Define MKL_INT here to use exactly the same 64bits integer type definitions.

    // If MKL_INT will not be defined here, the mkl header defines it as long long int.

    #define MKL_INT int64_t

    #define MKL_UINT uint64_t

  #endif

  #include <mkl_blas.h>

  #include <mkl_cblas.h>

  #include <mkl_vsl.h>

  #include <mkl_vsl_functions.h>

  #include <mkl_version.h>

#endif


#if MSHADOW_USE_CUDA

  #include <cuda.h>

  #include <cublas_v2.h>

  #include <curand.h>

#endif


#if MSHADOW_USE_CUDNN == 1

  #include <cudnn.h>

#endif


#if MSHADOW_USE_CUTENSOR == 1

  #include <cutensor.h>

#endif


#if MSHADOW_USE_CUSOLVER == 1

  #include <cusolverDn.h>

#endif


#if MSHADOW_USE_NVML

  #include <nvml.h>

#endif


// --------------------------------

// MSHADOW_XINLINE is used for inlining template code for both CUDA and CPU code

// MSHADOW_XINLINE is owned by this header; a definition coming from anywhere
// else is a hard error.
#if defined(MSHADOW_XINLINE)
#error "MSHADOW_XINLINE must not be defined"
#endif

// MSHADOW_FORCE_INLINE: compiler-specific spelling of "always inline".
// The MSVC branch also disables warning 4068.
#if defined(_MSC_VER)
#define MSHADOW_FORCE_INLINE __forceinline
#pragma warning(disable : 4068)
#else
#define MSHADOW_FORCE_INLINE inline __attribute__((always_inline))
#endif

// MSHADOW_XINLINE: forced inline, additionally marked __device__ __host__
// when compiled with __CUDACC__.
#if defined(__CUDACC__)
#define MSHADOW_XINLINE MSHADOW_FORCE_INLINE __device__ __host__
#else
#define MSHADOW_XINLINE MSHADOW_FORCE_INLINE
#endif

// MSHADOW_CINLINE: forced inline without the CUDA qualifiers.
#define MSHADOW_CINLINE MSHADOW_FORCE_INLINE


// Text of a default template argument (" = ::mshadow::default_real_t").
// It expands to the "=" as well, so it is meant to follow a template
// parameter name directly.
#if !defined(MSHADOW_DEFAULT_DTYPE)
#define MSHADOW_DEFAULT_DTYPE = ::mshadow::default_real_t
#endif

// Follows DMLC_USE_GLOG unless the build sets it explicitly.
#if !defined(MSHADOW_USE_GLOG)
#define MSHADOW_USE_GLOG DMLC_USE_GLOG
#endif  // MSHADOW_USE_GLOG

// Exception specifications for functions that may / may not throw.
#define MSHADOW_THROW_EXCEPTION noexcept(false)
#define MSHADOW_NO_EXCEPTION  noexcept(true)


// MSHADOW_ALIGNED(x): compiler-specific attribute requesting x-byte alignment.
#if !defined(_MSC_VER)
#define MSHADOW_ALIGNED(x) __attribute__ ((aligned(x)))
#else
#define MSHADOW_ALIGNED(x) __declspec(align(x))
#endif


// Evaluates the CUDA runtime call `func` once and checks its status:
//   * cudaErrorCudartUnloading -> throws dmlc::Error carrying the CUDA error string;
//   * any other non-success    -> CHECK_EQ fails with "CUDA: <error string>".
// The expansion is a braced block, not an expression.
// NOTE: the status lives in a local named `e`, so an argument expression that
// itself mentions a variable called `e` would refer to this local instead.
// The name is kept because CHECK_EQ receives it as its first argument.
// Every line of the macro body must end in a backslash followed directly by
// the next line; a blank line in between ends the definition early.
#define MSHADOW_CUDA_CALL(func)                                    \
  {                                                                \
    cudaError_t e = (func);                                        \
    if (e == cudaErrorCudartUnloading) {                           \
      throw dmlc::Error(cudaGetErrorString(e));                    \
    }                                                              \
    CHECK_EQ(e, cudaSuccess)                                       \
        << "CUDA: " << cudaGetErrorString(e);                      \
  }


// Evaluates `func` and swallows any dmlc::Error it throws. The error text is
// logged at ERROR level as "Ignore CUDA Error <what>" unless it contains
// "driver shutting down", in which case nothing is logged. Other exception
// types propagate unchanged.
// Every line of the macro body must end in a backslash followed directly by
// the next line; a blank line in between ends the definition early.
#define MSHADOW_CATCH_ERROR(func)                                     \
  {                                                                   \
    try {                                                             \
      (func);                                                         \
    } catch (const dmlc::Error &e) {                                  \
      std::string what = e.what();                                    \
      if (what.find("driver shutting down") == std::string::npos) {   \
        LOG(ERROR) << "Ignore CUDA Error " << what;                   \
      }                                                               \
    }                                                                 \
  }


#include "./half.h"

#include "./bfloat.h"

// Defines `operator OP` for mixed half_t / bf16_t operands in both argument
// orders. Both operands are converted to float, combined with OP, and the
// result is returned as RTYPE.
// Every line of the macro body must end in a backslash followed directly by
// the next line; a blank line in between ends the definition early.
#define MSHADOW_HALF_BF_OPERATOR(RTYPE, OP)                                               \
  MSHADOW_XINLINE RTYPE operator OP(mshadow::half::half_t a, mshadow::bfloat::bf16_t b) { \
    return float(a) OP float(b); /* NOLINT(*) */                                          \
  }                                                                                       \
  MSHADOW_XINLINE RTYPE operator OP(mshadow::bfloat::bf16_t a, mshadow::half::half_t b) { \
    return float(a) OP float(b); /* NOLINT(*) */                                          \
  }

// Arithmetic operators yield float; ordering comparisons yield bool.
MSHADOW_HALF_BF_OPERATOR(float, +)
MSHADOW_HALF_BF_OPERATOR(float, -)
MSHADOW_HALF_BF_OPERATOR(float, *)
MSHADOW_HALF_BF_OPERATOR(float, /)
MSHADOW_HALF_BF_OPERATOR(bool, >)
MSHADOW_HALF_BF_OPERATOR(bool, <)
MSHADOW_HALF_BF_OPERATOR(bool, >=)
MSHADOW_HALF_BF_OPERATOR(bool, <=)


#include "dmlc/logging.h"


namespace mshadow {

// Size of the random-number buffer.
// NOTE(review): the unit (elements vs bytes) is not visible here - confirm at the use site.
const unsigned kRandBufferSize = 1000000;
// pi rounded to the nearest float. The literal carries more digits than a
// float can hold on purpose: the shorter "3.1415926f" rounds to the float one
// ULP *below* the closest representable value.
const float kPi = 3.14159265358979323846f;

// Tensor index type: 64-bit only when MSHADOW_INT64_TENSOR_SIZE == 1,
// otherwise 32-bit.
#if MSHADOW_INT64_TENSOR_SIZE == 1
  using index_t = int64_t;
#else
  using index_t = int32_t;
#endif

// Index type for OpenMP loops: always 64-bit on Windows, index_t elsewhere.
#if defined(_WIN32)
  using openmp_index_t = int64_t;
#else
  using openmp_index_t = index_t;
#endif

// Index type handed to LAPACK routines: index_t with MKL+LAPACK or with
// ILP64 LAPACKE, plain int otherwise.
#if (MSHADOW_USE_MKL && MXNET_USE_LAPACK) || MXNET_USE_ILP64_LAPACKE
  // lapack_index_t can be replaced by index_t and removed once all BLAS
  // libraries support large tensors
  using lapack_index_t = index_t;
#else
  using lapack_index_t = int;
#endif

// Default floating-point element type.
using default_real_t = float;


// Runtime tag identifying an element type. Values are assigned explicitly;
// DataType<T>::kFlag maps each C++ type to its tag (noted per enumerator).
enum TypeFlag {

  kFloat32 = 0,  // float

  kFloat64 = 1,  // double

  kFloat16 = 2,  // half::half_t

  kUint8 = 3,  // uint8_t

  kInt32 = 4,  // int32_t

  kInt8  = 5,  // int8_t

  kInt64 = 6,  // int64_t

  kBool = 7,  // bool

  kInt16 = 8,  // int16_t

  kUint16 = 9,  // uint16_t

  kUint32 = 10,  // uint32_t

  kUint64 = 11,  // uint64_t

  kBfloat16 = 12  // bfloat::bf16_t

};


// Compile-time traits for an element type. The primary template is only
// declared; each supported type provides a specialization.
template <typename DType>
struct DataType;

// float -> kFloat32.
template <>
struct DataType<float> {
  static constexpr int kFlag = kFloat32;
  static constexpr int kLanes = 1;
#if MSHADOW_USE_CUDA && (CUDA_VERSION >= 8000)
  static constexpr cudaDataType_t kCudaFlag = CUDA_R_32F;
#endif
#if MSHADOW_USE_CUDA && MSHADOW_USE_CUDNN
  static constexpr cudnnDataType_t kCudnnFlag = CUDNN_DATA_FLOAT;
  using ScaleType = float;
#endif
};

// double -> kFloat64.
template <>
struct DataType<double> {
  static constexpr int kFlag = kFloat64;
  static constexpr int kLanes = 1;
#if MSHADOW_USE_CUDA && (CUDA_VERSION >= 8000)
  static constexpr cudaDataType_t kCudaFlag = CUDA_R_64F;
#endif
#if MSHADOW_USE_CUDA && MSHADOW_USE_CUDNN
  static constexpr cudnnDataType_t kCudnnFlag = CUDNN_DATA_DOUBLE;
  using ScaleType = double;
#endif
};

// half::half_t -> kFloat16. With cuDNN, ScaleType is float rather than the
// element type itself.
template <>
struct DataType<half::half_t> {
  static constexpr int kFlag = kFloat16;
  static constexpr int kLanes = 1;
#if MSHADOW_USE_CUDA && (CUDA_VERSION >= 8000)
  static constexpr cudaDataType_t kCudaFlag = CUDA_R_16F;
#endif
#if MSHADOW_USE_CUDA && MSHADOW_USE_CUDNN
  static constexpr cudnnDataType_t kCudnnFlag = CUDNN_DATA_HALF;
  using ScaleType = float;
#endif
};

// bfloat::bf16_t -> kBfloat16. No CUDA or cuDNN constants are provided.
template <>
struct DataType<bfloat::bf16_t> {
  static constexpr int kFlag = kBfloat16;
  static constexpr int kLanes = 1;
};

// uint8_t -> kUint8.
template <>
struct DataType<uint8_t> {
  static constexpr int kFlag = kUint8;
  static constexpr int kLanes = 1;
#if MSHADOW_USE_CUDA && (CUDA_VERSION >= 8000)
  static constexpr cudaDataType_t kCudaFlag = CUDA_R_8U;
#endif
#if MSHADOW_USE_CUDA && (MSHADOW_USE_CUDNN == 1 && CUDNN_MAJOR >= 6)
  // no uint8 in cudnn for now, so the signed 8-bit tag is used
  static constexpr cudnnDataType_t kCudnnFlag = CUDNN_DATA_INT8;
  using ScaleType = uint8_t;
#endif
};

// int8_t -> kInt8.
template <>
struct DataType<int8_t> {
  static constexpr int kFlag = kInt8;
  static constexpr int kLanes = 1;
#if MSHADOW_USE_CUDA && (CUDA_VERSION >= 8000)
  static constexpr cudaDataType_t kCudaFlag = CUDA_R_8I;
#endif
#if MSHADOW_USE_CUDA && (MSHADOW_USE_CUDNN == 1 && CUDNN_MAJOR >= 6)
  static constexpr cudnnDataType_t kCudnnFlag = CUDNN_DATA_INT8;
  using ScaleType = int8_t;
#endif
};

// int32_t -> kInt32.
template <>
struct DataType<int32_t> {
  static constexpr int kFlag = kInt32;
  static constexpr int kLanes = 1;
#if MSHADOW_USE_CUDA && (CUDA_VERSION >= 8000)
  static constexpr cudaDataType_t kCudaFlag = CUDA_R_32I;
#endif
#if MSHADOW_USE_CUDA && (MSHADOW_USE_CUDNN == 1 && CUDNN_MAJOR >= 6)
  static constexpr cudnnDataType_t kCudnnFlag = CUDNN_DATA_INT32;
  using ScaleType = int32_t;
#endif
};

// The remaining integer/bool types expose only kFlag and kLanes; none of them
// carries CUDA or cuDNN constants.

// int64_t -> kInt64.
template <>
struct DataType<int64_t> {
  static constexpr int kFlag = kInt64;
  static constexpr int kLanes = 1;
};

// bool -> kBool.
template <>
struct DataType<bool> {
  static constexpr int kFlag = kBool;
  static constexpr int kLanes = 1;
};

// int16_t -> kInt16.
template <>
struct DataType<int16_t> {
  static constexpr int kFlag = kInt16;
  static constexpr int kLanes = 1;
};

// uint16_t -> kUint16.
template <>
struct DataType<uint16_t> {
  static constexpr int kFlag = kUint16;
  static constexpr int kLanes = 1;
};

// uint32_t -> kUint32.
template <>
struct DataType<uint32_t> {
  static constexpr int kFlag = kUint32;
  static constexpr int kLanes = 1;
};

// uint64_t -> kUint64.
template <>
struct DataType<uint64_t> {
  static constexpr int kFlag = kUint64;
  static constexpr int kLanes = 1;
};


// TypeFlag value of default_real_t.
const int default_type_flag = DataType<default_real_t>::kFlag;


// TypeFlag value of lapack_index_t.
const int index_type_flag = DataType<lapack_index_t>::kFlag;


// Tensor memory layouts. The 4-d (image), 3-d (sequence) and 5-d (volume)
// families start at 0, 1 << 3 and 1 << 5 respectively; members of a family
// are numbered consecutively from its base.
enum LayoutFlag {
  kUNKNOWN = -1,

  // 4-d layouts
  kNCHW = 0,
  kNHWC = kNCHW + 1,
  kCHWN = kNCHW + 2,

  // 3-d layouts
  kNCW = 1 << 3,
  kNWC = kNCW + 1,
  kCWN = kNCW + 2,

  // 5-d layouts
  kNCDHW = 1 << 5,
  kNDHWC = kNCDHW + 1,
  kCDHWN = kNCDHW + 2
};


// Parses a layout name into its LayoutFlag.
//   layoutstr: exact, case-sensitive name ("NCHW", "NWC", "NDHWC", ...).
//   returns:   the matching flag, or kUNKNOWN for any other string.
// The argument is taken by const reference so a call no longer copies the
// string; callers passing std::string or a string literal are unaffected.
inline LayoutFlag layoutFlag(const std::string& layoutstr) {
  struct NamedLayout {
    const char* name;
    LayoutFlag flag;
  };
  const NamedLayout known[] = {
    {"NHWC", kNHWC},   {"NCHW", kNCHW},   {"CHWN", kCHWN},
    {"NWC", kNWC},     {"NCW", kNCW},     {"CWN", kCWN},
    {"NDHWC", kNDHWC}, {"NCDHW", kNCDHW}, {"CDHWN", kCDHWN},
  };
  for (const NamedLayout& entry : known) {
    if (layoutstr == entry.name) {
      return entry.flag;
    }
  }
  return kUNKNOWN;
}


// Returns the textual name of a layout ("NCHW", "NWC", ...). kUNKNOWN and any
// value that is not a named LayoutFlag yield the empty string.
inline std::string toString(LayoutFlag layout) {
  struct NamedLayout {
    LayoutFlag flag;
    const char* name;
  };
  const NamedLayout known[] = {
    {kNCHW, "NCHW"},   {kNHWC, "NHWC"},   {kCHWN, "CHWN"},
    {kNCW, "NCW"},     {kNWC, "NWC"},     {kCWN, "CWN"},
    {kNCDHW, "NCDHW"}, {kNDHWC, "NDHWC"}, {kCDHWN, "CDHWN"},
  };
  for (const NamedLayout& entry : known) {
    if (layout == entry.flag) {
      return entry.name;
    }
  }
  return "";
}


// Compile-time traits of a layout. The primary template is only declared;
// layouts with traits provide a specialization.
template <int layout>
struct LayoutType;

// kNCHW: 4 dimensions. kCudnnFlag is the cuDNN tensor format when built with
// CUDA and cuDNN (major version >= 4), otherwise the placeholder -1.
template <>
struct LayoutType<kNCHW> {
  static constexpr index_t kNdim = 4;
#if !(MSHADOW_USE_CUDA && MSHADOW_USE_CUDNN == 1 && CUDNN_MAJOR >= 4)
  static constexpr int kCudnnFlag = -1;
#else
  static constexpr cudnnTensorFormat_t kCudnnFlag = CUDNN_TENSOR_NCHW;
#endif
};


// kNHWC: 4 dimensions. kCudnnFlag is the cuDNN tensor format when built with
// CUDA and cuDNN (major version >= 4), otherwise the placeholder -1.
template <>
struct LayoutType<kNHWC> {
  static constexpr index_t kNdim = 4;
#if !(MSHADOW_USE_CUDA && MSHADOW_USE_CUDNN == 1 && CUDNN_MAJOR >= 4)
  static constexpr int kCudnnFlag = -1;
#else
  static constexpr cudnnTensorFormat_t kCudnnFlag = CUDNN_TENSOR_NHWC;
#endif
};


// Layout assumed for 4-d data when none is specified: kNCHW.
const int default_layout = kNCHW;


// kNCDHW: 5 dimensions. With cuDNN it uses the same format tag as the 4-d
// kNCHW layout (CUDNN_TENSOR_NCHW); without cuDNN the placeholder is -1.
template <>
struct LayoutType<kNCDHW> {
  static constexpr index_t kNdim = 5;
#if !(MSHADOW_USE_CUDA && MSHADOW_USE_CUDNN == 1 && CUDNN_MAJOR >= 4)
  static constexpr int kCudnnFlag = -1;
#else
  static constexpr cudnnTensorFormat_t kCudnnFlag = CUDNN_TENSOR_NCHW;
#endif
};


// kNDHWC: 5 dimensions. With cuDNN it uses the same format tag as the 4-d
// kNHWC layout (CUDNN_TENSOR_NHWC); without cuDNN the placeholder is -1.
template <>
struct LayoutType<kNDHWC> {
  static constexpr index_t kNdim = 5;
#if !(MSHADOW_USE_CUDA && MSHADOW_USE_CUDNN == 1 && CUDNN_MAJOR >= 4)
  static constexpr int kCudnnFlag = -1;
#else
  static constexpr cudnnTensorFormat_t kCudnnFlag = CUDNN_TENSOR_NHWC;
#endif
};


// Layout assumed for 5-d data when none is specified: kNCDHW.
const int default_layout_5d = kNCDHW;


namespace op {
// Binary operators. Each functor exposes a static Map(lhs, rhs) that combines
// two values of the same type.

// Product: lhs * rhs.
struct mul {
  template <typename DType>
  MSHADOW_XINLINE static DType Map(DType lhs, DType rhs) {
    return lhs * rhs;
  }
};

// Sum: lhs + rhs.
struct plus {
  template <typename DType>
  MSHADOW_XINLINE static DType Map(DType lhs, DType rhs) {
    return lhs + rhs;
  }
};

// Difference: lhs - rhs.
struct minus {
  template <typename DType>
  MSHADOW_XINLINE static DType Map(DType lhs, DType rhs) {
    return lhs - rhs;
  }
};

// Quotient: lhs / rhs.
struct div {
  template <typename DType>
  MSHADOW_XINLINE static DType Map(DType lhs, DType rhs) {
    return lhs / rhs;
  }
};

// Selects the right-hand operand and ignores the left one.
struct right {
  template <typename DType>
  MSHADOW_XINLINE static DType Map(DType /*lhs*/, DType rhs) {
    return rhs;
  }
};

// Unary operator example. Users can define their own operators in the same
// style as the functors above and apply them as F<op::identity>( src ).
struct identity {
  template <typename DType>
  MSHADOW_XINLINE static DType Map(DType value) {
    return value;
  }
};
}  // namespace op

namespace sv {
// "Savers": how a computed value is written into its destination. Each one
// names the matching binary operator as OPType. The first three also expose
// an AlphaBLAS/BetaBLAS pair.
// NOTE(review): these presumably are the alpha/beta scalars handed to BLAS
// calls of the form dst = alpha * result + beta * dst - confirm at call sites.

// dst = src
struct saveto {
  template <typename DType>
  MSHADOW_XINLINE static void Save(DType& dst, DType src) {  // NOLINT(*)
    dst = src;
  }
  static inline default_real_t AlphaBLAS() { return 1.0f; }
  static inline default_real_t BetaBLAS() { return 0.0f; }
  using OPType = op::right;
};

// dst += src
struct plusto {
  template <typename DType>
  MSHADOW_XINLINE static void Save(DType& dst, DType src) {  // NOLINT(*)
    dst += src;
  }
  static inline default_real_t AlphaBLAS() { return 1.0f; }
  static inline default_real_t BetaBLAS() { return 1.0f; }
  using OPType = op::plus;
};

// dst -= src
struct minusto {
  template <typename DType>
  MSHADOW_XINLINE static void Save(DType& dst, DType src) {  // NOLINT(*)
    dst -= src;
  }
  static inline default_real_t AlphaBLAS() { return -1.0f; }
  static inline default_real_t BetaBLAS() { return 1.0f; }
  using OPType = op::minus;
};

// dst *= src (no BLAS coefficients)
struct multo {
  template <typename DType>
  MSHADOW_XINLINE static void Save(DType& dst, DType src) {  // NOLINT(*)
    dst *= src;
  }
  using OPType = op::mul;
};

// dst /= src (no BLAS coefficients)
struct divto {
  template <typename DType>
  MSHADOW_XINLINE static void Save(DType& dst, DType src) {  // NOLINT(*)
    dst /= src;
  }
  using OPType = op::div;
};
}  // namespace sv


// Make std::isnan / std::isinf callable unqualified inside namespace mshadow,
// but only when __CUDA_ARCH__ is not defined.
#ifndef __CUDA_ARCH__

using std::isnan;

using std::isinf;

#endif


namespace isnan_typed {
  // Type-dispatched NaN test. The generic version reports "not NaN"; only the
  // floating-point types specialized below can return true.
  template <typename DType>
  MSHADOW_XINLINE bool IsNan(volatile DType x) {
    return false;
  }

  // Native floating-point types defer to the unqualified isnan().
  template <>
  MSHADOW_XINLINE bool IsNan<float>(volatile float x) {
    return isnan(x);
  }
  template <>
  MSHADOW_XINLINE bool IsNan<double>(volatile double x) {
    return isnan(x);
  }
  template <>
  MSHADOW_XINLINE bool IsNan<long double>(volatile long double x) {
    return isnan(x);
  }

  // 16-bit types test the raw bits: with the sign bit cleared, a value above
  // the all-ones exponent pattern is NaN.
  template <>
  MSHADOW_XINLINE bool IsNan<mshadow::half::half_t>(volatile mshadow::half::half_t x) {
    return (x.half_ & (~MSHADOW_HALF_SIGN_BIT)) > MSHADOW_HALF_EXPONENT_BITS;
  }
  template <>
  MSHADOW_XINLINE bool IsNan<mshadow::bfloat::bf16_t>(volatile mshadow::bfloat::bf16_t x) {
    return (x.bf16_ & (~MSHADOW_BF16_SIGN_BIT)) > MSHADOW_BF16_EXPONENT_BITS;
  }
}  // namespace isnan_typed


namespace isinf_typed {
  // Type-dispatched infinity test. The generic version reports "not
  // infinite"; only the floating-point types specialized below can return
  // true.
  template <typename DType>
  MSHADOW_XINLINE bool IsInf(volatile DType x) {
    return false;
  }

  // Native floating-point types defer to the unqualified isinf().
  template <>
  MSHADOW_XINLINE bool IsInf<float>(volatile float x) {
    return isinf(x);
  }
  template <>
  MSHADOW_XINLINE bool IsInf<double>(volatile double x) {
    return isinf(x);
  }
  template <>
  MSHADOW_XINLINE bool IsInf<long double>(volatile long double x) {
    return isinf(x);
  }

  // 16-bit types test the raw bits: with the sign bit cleared, a value equal
  // to the all-ones exponent pattern is +/- infinity.
  template <>
  MSHADOW_XINLINE bool IsInf<mshadow::half::half_t>(volatile mshadow::half::half_t x) {
    return (x.half_ & (~MSHADOW_HALF_SIGN_BIT)) == MSHADOW_HALF_EXPONENT_BITS;
  }
  template <>
  MSHADOW_XINLINE bool IsInf<mshadow::bfloat::bf16_t>(volatile mshadow::bfloat::bf16_t x) {
    return (x.bf16_ & (~MSHADOW_BF16_SIGN_BIT)) == MSHADOW_BF16_EXPONENT_BITS;
  }
}  // namespace isinf_typed


namespace red {

namespace limits {

// Lowest value of DType. Only declared here; each supported type supplies a
// specialization, so using an unsupported type fails at link/compile time.
template <typename DType>
MSHADOW_XINLINE DType MinValue();

// float: most negative finite value.
template <>
MSHADOW_XINLINE float MinValue<float>() {
  return -FLT_MAX;
}

// double: most negative finite value.
template <>
MSHADOW_XINLINE double MinValue<double>() {
  return -DBL_MAX;
}

// half_t: the MSHADOW_HALF_MIN constant.
template <>
MSHADOW_XINLINE half::half_t MinValue<half::half_t>() {
  return MSHADOW_HALF_MIN;
}

// bf16_t: the MSHADOW_BF16_MIN constant.
template <>
MSHADOW_XINLINE bfloat::bf16_t MinValue<bfloat::bf16_t>() {
  return MSHADOW_BF16_MIN;
}

template <>
MSHADOW_XINLINE uint8_t MinValue<uint8_t>() {
  return 0;
}

template <>
MSHADOW_XINLINE int8_t MinValue<int8_t>() {
  return SCHAR_MIN;
}

// The return type is spelled int32_t (not int) so it always matches the
// primary template's DType, even on a platform where int32_t is not int.
template <>
MSHADOW_XINLINE int32_t MinValue<int32_t>() {
  return INT_MIN;
}

template <>
MSHADOW_XINLINE int64_t MinValue<int64_t>() {
  return LLONG_MIN;
}

template <>
MSHADOW_XINLINE bool MinValue<bool>() {
  return false;
}

template <>
MSHADOW_XINLINE unsigned int MinValue<unsigned int>() {
  return 0;
}


// Negative infinity of DType. Types without an infinity fall back to
// MinValue<DType>(); the floating-point types below return a true -inf.
template <typename DType>
MSHADOW_XINLINE DType NegInfValue() {
  return MinValue<DType>();
}

template <>
MSHADOW_XINLINE float NegInfValue<float>() {
  return -HUGE_VALF;
}

template <>
MSHADOW_XINLINE double NegInfValue<double>() {
  return -HUGE_VAL;
}

// 16-bit types are built from raw bits: sign bit set, exponent all ones.
template <>
MSHADOW_XINLINE half::half_t NegInfValue<half::half_t>() {
  return half::half_t::Binary(MSHADOW_HALF_SIGN_BIT | MSHADOW_HALF_EXPONENT_BITS);
}

template <>
MSHADOW_XINLINE bfloat::bf16_t NegInfValue<bfloat::bf16_t>() {
  return bfloat::bf16_t::Binary(MSHADOW_BF16_SIGN_BIT | MSHADOW_BF16_EXPONENT_BITS);
}


// Largest finite value of DType. Only declared here; each supported type
// supplies a specialization.
template <typename DType>
MSHADOW_XINLINE DType MaxValue();

template <>
MSHADOW_XINLINE float MaxValue<float>() {
  return FLT_MAX;
}

template <>
MSHADOW_XINLINE double MaxValue<double>() {
  return DBL_MAX;
}

// half_t: the MSHADOW_HALF_MAX constant.
template <>
MSHADOW_XINLINE half::half_t MaxValue<half::half_t>() {
  return MSHADOW_HALF_MAX;
}

// bf16_t: the MSHADOW_BF16_MAX constant.
template <>
MSHADOW_XINLINE bfloat::bf16_t MaxValue<bfloat::bf16_t>() {
  return MSHADOW_BF16_MAX;
}

template <>
MSHADOW_XINLINE uint8_t MaxValue<uint8_t>() {
  return UCHAR_MAX;
}

template <>
MSHADOW_XINLINE int8_t MaxValue<int8_t>() {
  return SCHAR_MAX;
}

// The return type is spelled int32_t (not int) so it always matches the
// primary template's DType, even on a platform where int32_t is not int.
template <>
MSHADOW_XINLINE int32_t MaxValue<int32_t>() {
  return INT_MAX;
}

template <>
MSHADOW_XINLINE int64_t MaxValue<int64_t>() {
  return LLONG_MAX;
}

template <>
MSHADOW_XINLINE bool MaxValue<bool>() {
  return true;
}

template <>
MSHADOW_XINLINE uint32_t MaxValue<uint32_t>() {
  return std::numeric_limits<uint32_t>::max();
}


// Positive infinity of DType. Types without an infinity fall back to
// MaxValue<DType>(); the floating-point types below return a true +inf.
template <typename DType>
MSHADOW_XINLINE DType PosInfValue() {
  return MaxValue<DType>();
}

template <>
MSHADOW_XINLINE float PosInfValue<float>() {
  return HUGE_VALF;
}

template <>
MSHADOW_XINLINE double PosInfValue<double>() {
  return HUGE_VAL;
}

// 16-bit types are built from raw bits: sign bit clear, exponent all ones.
template <>
MSHADOW_XINLINE half::half_t PosInfValue<half::half_t>() {
  return half::half_t::Binary(MSHADOW_HALF_EXPONENT_BITS);
}

template <>
MSHADOW_XINLINE bfloat::bf16_t PosInfValue<bfloat::bf16_t>() {
  return bfloat::bf16_t::Binary(MSHADOW_BF16_EXPONENT_BITS);
}


}  // namespace limits


// Sum reducer. The two-argument overloads accumulate directly; the overloads
// that carry a `residual` use Kahan compensated summation, where the residual
// holds the rounding error lost by earlier additions.
struct sum {
  // Plain accumulation: dst += src.
  template <typename DType>
  MSHADOW_XINLINE static void Reduce(volatile DType& dst, volatile DType src) {  // NOLINT(*)
    dst += src;
  }

  // Kahan step: add src, corrected by the error carried in residual, and
  // record the new error. Once the running total becomes infinite the
  // residual is reset to 0.
  template <typename DType>
  MSHADOW_XINLINE static void Reduce(volatile DType& dst, volatile DType src, volatile DType& residual) {  // NOLINT(*)
    DType corrected = src - residual;
    DType total = dst + corrected;
    if (!isinf_typed::IsInf(total)) {
      residual = (total - dst) - corrected;
    } else {
      residual = 0;
    }
    dst = total;
  }

  // Combine two partial sums without compensation.
  template <typename DType>
  MSHADOW_XINLINE static void Merge(volatile DType& dst_val, volatile DType& src_val) {  // NOLINT(*)
    Reduce(dst_val, src_val);
  }

  // Combine two compensated partial sums (value + residual each) into dst.
  // If the combined value is infinite it is stored as-is with a zero residual.
  template <typename DType>
  MSHADOW_XINLINE static void Merge(volatile DType& dst_val, volatile DType& dst_residual, volatile DType& src_val, volatile DType& src_residual) {  // NOLINT(*)
    DType merged = dst_val + src_val;
    if (!isinf_typed::IsInf(merged)) {
      DType delta = merged - dst_val;
      DType carry = ((src_val - delta) + (dst_val - (merged - delta))) + dst_residual + src_residual;
      dst_val = merged + carry;
      dst_residual = carry - (dst_val - merged);
    } else {
      dst_val = merged;
      dst_residual = 0;
    }
  }

  // No post-processing is needed for a sum.
  template <typename DType>
  MSHADOW_XINLINE static void Finalize(volatile DType& dst) {}  // NOLINT(*)
  template <typename DType>
  MSHADOW_XINLINE static void Finalize(volatile DType& dst, volatile DType& residual) {}  // NOLINT(*)

  // Gradient of the reduction result with respect to any source element: 1.
  template <typename DType>
  MSHADOW_XINLINE static DType PartialGrad(DType redres, DType redsrc) {
    return 1;
  }

  // Identity element of the reduction: 0 (and a zero residual).
  template <typename DType>
  MSHADOW_XINLINE static void SetInitValue(DType& initv) {  // NOLINT(*)
    initv = 0;
  }
  template <typename DType>
  MSHADOW_XINLINE static void SetInitValue(DType& initv, DType& residual) {  // NOLINT(*)
    SetInitValue(initv);
    residual = 0;
  }
};

// Maximum reducer. NaN is sticky: once dst is NaN it is never replaced, and a
// NaN src replaces a non-NaN dst because `dst >= src` is then false.
// The overloads carrying an extra residual/none argument exist for interface
// parity with `sum` and ignore it.
struct maximum {
  template <typename DType>
  MSHADOW_XINLINE static void Reduce(volatile DType& dst, volatile DType src) {  // NOLINT(*)
    if (isnan_typed::IsNan(dst)) {
      return;
    }
    if (!(dst >= src)) {
      dst = src;
    }
  }
  template <typename DType>
  MSHADOW_XINLINE static void Reduce(volatile DType& dst, volatile DType src, volatile DType& none) {  // NOLINT(*)
    Reduce(dst, src);
  }

  // Merging two partial maxima is the same as reducing one into the other.
  template <typename DType>
  MSHADOW_XINLINE static void Merge(volatile DType& dst_val, volatile DType& src_val) {  // NOLINT(*)
    Reduce(dst_val, src_val);
  }
  template <typename DType>
  MSHADOW_XINLINE static void Merge(volatile DType& dst_val, volatile DType& dst_residual, volatile DType& src_val, volatile DType& src_residual) {  // NOLINT(*)
    Reduce(dst_val, src_val);
  }

  // No post-processing is needed.
  template <typename DType>
  MSHADOW_XINLINE static void Finalize(volatile DType& dst) {}  // NOLINT(*)
  template <typename DType>
  MSHADOW_XINLINE static void Finalize(volatile DType& dst, volatile DType& residual) {}  // NOLINT(*)

  // Gradient: 1 for source elements equal to the reduction result, else 0.
  template <typename DType>
  MSHADOW_XINLINE static DType PartialGrad(DType redres, DType redsrc) {
    if (redres == redsrc) {
      return 1;
    }
    return 0;
  }

  // Starting value: negative infinity (or the type's minimum if it has none).
  template <typename DType>
  MSHADOW_XINLINE static void SetInitValue(DType& initv) {  // NOLINT(*)
    initv = limits::NegInfValue<DType>();
  }
  template <typename DType>
  MSHADOW_XINLINE static void SetInitValue(DType& initv, DType& none) {  // NOLINT(*)
    SetInitValue(initv);
  }
};

// Minimum reducer. NaN is sticky: once dst is NaN it is never replaced, and a
// NaN src replaces a non-NaN dst because `dst <= src` is then false.
// The overloads carrying an extra residual/none argument exist for interface
// parity with `sum` and ignore it.
struct minimum {
  template <typename DType>
  MSHADOW_XINLINE static void Reduce(volatile DType& dst, volatile DType src) {  // NOLINT(*)
    if (isnan_typed::IsNan(dst)) {
      return;
    }
    if (!(dst <= src)) {
      dst = src;
    }
  }
  template <typename DType>
  MSHADOW_XINLINE static void Reduce(volatile DType& dst, volatile DType src, volatile DType& none) {  // NOLINT(*)
    Reduce(dst, src);
  }

  // Merging two partial minima is the same as reducing one into the other.
  template <typename DType>
  MSHADOW_XINLINE static void Merge(volatile DType& dst_val, volatile DType& src_val) {  // NOLINT(*)
    Reduce(dst_val, src_val);
  }
  template <typename DType>
  MSHADOW_XINLINE static void Merge(volatile DType& dst_val, volatile DType& dst_residual, volatile DType& src_val, volatile DType& src_residual) {  // NOLINT(*)
    Reduce(dst_val, src_val);
  }

  // No post-processing is needed.
  template <typename DType>
  MSHADOW_XINLINE static void Finalize(volatile DType& dst) {}  // NOLINT(*)
  template <typename DType>
  MSHADOW_XINLINE static void Finalize(volatile DType& dst, volatile DType& residual) {}  // NOLINT(*)

  // Gradient: 1 for source elements equal to the reduction result, else 0.
  template <typename DType>
  MSHADOW_XINLINE static DType PartialGrad(DType redres, DType redsrc) {
    if (redres == redsrc) {
      return 1;
    }
    return 0;
  }

  // Starting value: positive infinity (or the type's maximum if it has none).
  template <typename DType>
  MSHADOW_XINLINE static void SetInitValue(DType& initv) {  // NOLINT(*)
    initv = limits::PosInfValue<DType>();
  }
  template <typename DType>
  MSHADOW_XINLINE static void SetInitValue(DType& initv, DType& none) {  // NOLINT(*)
    SetInitValue(initv);
  }
};

}  // namespace red


// --- helpers for MSHADOW_TYPE_SWITCH (implementation detail) ---------------
// Every line of a multi-line macro must end in a backslash followed directly
// by the next line; a blank line in between ends the definition early.

// One supported case: binds DType to `ctype` with a typedef and runs the
// caller's statements inside their own scope.
#define MSHADOW_TYPE_SWITCH_CASE_(flag, ctype, DType, ...)  \
  case flag:                                                \
    {                                                       \
      typedef ctype DType;                                  \
      {__VA_ARGS__}                                         \
    }                                                       \
    break;

// One unsupported case: aborts through LOG(FATAL). `type_name` is a string
// literal spliced into "This operation does not support <type_name> type".
#define MSHADOW_TYPE_SWITCH_UNSUPPORTED_(flag, type_name)   \
  case flag:                                                \
    LOG(FATAL) << "This operation does not "                \
                  "support " type_name " type";             \
    break;

// bfloat16 is dispatched only when not compiling with nvcc; under nvcc the
// case is omitted, so kBfloat16 reaches the `default` branch.
#ifndef __NVCC__
#define MSHADOW_TYPE_SWITCH_BF16_CASE_(DType, ...)                      \
  MSHADOW_TYPE_SWITCH_CASE_(mshadow::kBfloat16, mshadow::bfloat::bf16_t, \
                            DType, __VA_ARGS__)
#else
#define MSHADOW_TYPE_SWITCH_BF16_CASE_(DType, ...)
#endif

// Runtime-to-compile-time type dispatch.
//   type:  a TypeFlag value, evaluated in a `switch`.
//   DType: name that the statements may use for the selected element type.
//   ...:   statements to run with DType bound.
// Supported: float32, float64, float16, bfloat16 (non-nvcc only), uint8, int8,
// int32, int64. bool/int16/uint16/uint32/uint64 and unknown values abort
// through LOG(FATAL).
#define MSHADOW_TYPE_SWITCH(type, DType, ...)                                             \
  switch (type) {                                                                         \
  MSHADOW_TYPE_SWITCH_CASE_(mshadow::kFloat32, float, DType, __VA_ARGS__)                 \
  MSHADOW_TYPE_SWITCH_CASE_(mshadow::kFloat64, double, DType, __VA_ARGS__)                \
  MSHADOW_TYPE_SWITCH_CASE_(mshadow::kFloat16, mshadow::half::half_t, DType, __VA_ARGS__) \
  MSHADOW_TYPE_SWITCH_BF16_CASE_(DType, __VA_ARGS__)                                      \
  MSHADOW_TYPE_SWITCH_CASE_(mshadow::kUint8, uint8_t, DType, __VA_ARGS__)                 \
  MSHADOW_TYPE_SWITCH_CASE_(mshadow::kInt8, int8_t, DType, __VA_ARGS__)                   \
  MSHADOW_TYPE_SWITCH_CASE_(mshadow::kInt32, int32_t, DType, __VA_ARGS__)                 \
  MSHADOW_TYPE_SWITCH_CASE_(mshadow::kInt64, int64_t, DType, __VA_ARGS__)                 \
  MSHADOW_TYPE_SWITCH_UNSUPPORTED_(mshadow::kBool, "bool")                                \
  MSHADOW_TYPE_SWITCH_UNSUPPORTED_(mshadow::kInt16, "int16")                              \
  MSHADOW_TYPE_SWITCH_UNSUPPORTED_(mshadow::kUint16, "uint16")                            \
  MSHADOW_TYPE_SWITCH_UNSUPPORTED_(mshadow::kUint32, "uint32")                            \
  MSHADOW_TYPE_SWITCH_UNSUPPORTED_(mshadow::kUint64, "uint64")                            \
  default:                                                                                \
    LOG(FATAL) << "Unknown type enum " << type;                                           \
  }


/*!
 * \brief Dispatch on a runtime type enum restricted to float and double.
 *
 * Expands to a bare `switch` statement. For mshadow::kFloat32 and
 * mshadow::kFloat64 the variadic body is emitted inside a scope in which
 * `DType` is a typedef for float or double respectively. Every other value
 * reaches the default branch, which reports the error through LOG(FATAL).
 *
 * \param type  expression yielding the type enum; used as the switch operand
 * \param DType identifier to declare as the element typedef
 * \param ...   statements to instantiate once per supported type
 */
#define MSHADOW_SGL_DBL_TYPE_SWITCH(type, DType, ...)  \

  switch (type) {                                      \

  case mshadow::kFloat32:                              \

    {                                                  \

      typedef float DType;                             \

      {__VA_ARGS__}                                    \

    }                                                  \

    break;                                             \

  case mshadow::kFloat64:                              \

    {                                                  \

      typedef double DType;                            \

      {__VA_ARGS__}                                    \

    }                                                  \

    break;                                             \

  default:                                             \

    LOG(FATAL) << "This operation only supports "      \

                  "32-bit and 64-bit floating point";  \

  }


/*!
 * \brief Dispatch on a runtime type enum, accepting float, double and half.
 *
 * Expands to a bare `switch` statement. For mshadow::kFloat32,
 * mshadow::kFloat64 and mshadow::kFloat16 the variadic body is emitted in a
 * scope where `DType` is a typedef for float, double or
 * mshadow::half::half_t. The integer and bool enumerators (kUint8, kInt8,
 * kInt32, kInt64, kBool, kInt16, kUint16, kUint32, kUint64) each have their
 * own case that only reports a type-specific message through LOG(FATAL).
 * Any value without a case label, which here includes mshadow::kBfloat16,
 * reaches the default branch and is reported as an unknown enum.
 *
 * \param type  expression yielding the type enum; it appears both as the
 *              switch operand and in the default-branch message
 * \param DType identifier to declare as the element typedef
 * \param ...   statements to instantiate once per supported type
 */
#define MSHADOW_REAL_TYPE_SWITCH(type, DType, ...)  \

  switch (type) {                                   \

  case mshadow::kFloat32:                           \

    {                                               \

      typedef float DType;                          \

      {__VA_ARGS__}                                 \

    }                                               \

    break;                                          \

  case mshadow::kFloat64:                           \

    {                                               \

      typedef double DType;                         \

      {__VA_ARGS__}                                 \

    }                                               \

    break;                                          \

  case mshadow::kFloat16:                           \

    {                                               \

      typedef mshadow::half::half_t DType;          \

      {__VA_ARGS__}                                 \

    }                                               \

    break;                                          \

  case mshadow::kUint8:                             \

    LOG(FATAL) << "This operation only support "    \

                  "floating point types not uint8"; \

    break;                                          \

  case mshadow::kInt8:                              \

    LOG(FATAL) << "This operation only support "    \

                  "floating point types not int8";  \

    break;                                          \

  case mshadow::kInt32:                             \

    LOG(FATAL) << "This operation only support "    \

                  "floating point types, not int32";\

    break;                                          \

  case mshadow::kInt64:                             \

    LOG(FATAL) << "This operation only support "    \

                  "floating point types, not int64";\

    break;                                          \

  case mshadow::kBool:                              \

    LOG(FATAL) << "This operation only support "    \

                  "floating point types, not bool"; \

    break;                                          \

  case mshadow::kInt16:                             \

    LOG(FATAL) << "This operation only support "    \

                  "floating point types, not int16";\

    break;                                          \

  case mshadow::kUint16:                            \

    LOG(FATAL) << "This operation only support "    \

                  "floating point types not uint16";\

    break;                                          \

  case mshadow::kUint32:                            \

    LOG(FATAL) << "This operation only support "    \

                  "floating point types not uint32";\

    break;                                          \

  case mshadow::kUint64:                            \

    LOG(FATAL) << "This operation only support "    \

                  "floating point types not uint64";\

    break;                                          \

  default:                                          \

    LOG(FATAL) << "Unknown type enum " << type;     \

  }


#ifndef __NVCC__

/*!
 * \brief Floating-point type dispatch that declares two typedefs per case.
 *
 * This definition is the one selected when __NVCC__ is not defined. It
 * expands to a bare `switch` statement; for each supported enumerator the
 * variadic body is emitted in a scope with these typedefs:
 *   - mshadow::kFloat32  : DType$ = float,                  DLargeType$ = float
 *   - mshadow::kFloat64  : DType$ = double,                 DLargeType$ = double
 *   - mshadow::kFloat16  : DType$ = mshadow::half::half_t,  DLargeType$ = float
 *   - mshadow::kBfloat16 : DType$ = mshadow::bfloat::bf16_t, DLargeType$ = float
 * The integer and bool enumerators each have a case that only reports a
 * type-specific message through LOG(FATAL); anything else reaches the
 * default branch and is reported as an unknown enum.
 *
 * NOTE(review): DLargeType$ is presumably meant as a wider type for
 * intermediate results of the 16-bit formats - confirm against callers.
 * NOTE(review): the parameter names contain '$', which relies on the
 * compiler accepting '$' in identifiers.
 *
 * \param type$       expression yielding the type enum; it appears both as
 *                    the switch operand and in the default-branch message
 * \param DType$      identifier to declare as the element typedef
 * \param DLargeType$ identifier to declare as the second typedef
 * \param ...         statements to instantiate once per supported type
 */
#define MSHADOW_REAL_TYPE_SWITCH_EX(type$, DType$, DLargeType$, ...)  \

  switch (type$) {                                  \

  case mshadow::kFloat32:                           \

    {                                               \

      typedef float DType$;                         \

      typedef float DLargeType$;                    \

      {__VA_ARGS__}                                 \

    }                                               \

    break;                                          \

  case mshadow::kFloat64:                           \

    {                                               \

      typedef double DType$;                        \

      typedef double DLargeType$;                   \

      {__VA_ARGS__}                                 \

    }                                               \

    break;                                          \

  case mshadow::kFloat16:                           \

    {                                               \

      typedef mshadow::half::half_t DType$;         \

      typedef float DLargeType$;                    \

      {__VA_ARGS__}                                 \

    }                                               \

    break;                                          \

  case mshadow::kBfloat16:                          \

    {                                               \

      typedef mshadow::bfloat::bf16_t DType$;       \

      typedef float DLargeType$;                    \

      {__VA_ARGS__}                                 \

    }                                               \

    break;                                          \

  case mshadow::kUint8:                             \

    LOG(FATAL) << "This operation only support "    \

                  "floating point types not uint8"; \

    break;                                          \

  case mshadow::kInt8:                              \

    LOG(FATAL) << "This operation only support "    \

                  "floating point types not int8";  \

    break;                                          \

  case mshadow::kInt32:                             \

    LOG(FATAL) << "This operation only support "    \

                  "floating point types, not int32";\

    break;                                          \

  case mshadow::kInt64:                             \

    LOG(FATAL) << "This operation only support "    \

                  "floating point types, not int64";\

    break;                                          \

  case mshadow::kBool:                              \

    LOG(FATAL) << "This operation only support "    \

                  "floating point types, not bool"; \

    break;                                          \

  case mshadow::kInt16:                             \

    LOG(FATAL) << "This operation only support "    \

                  "floating point types, not int16";\

    break;                                          \

  case mshadow::kUint16:                            \

    LOG(FATAL) << "This operation only support "    \

                  "floating point types not uint16";\

    break;                                          \

  case mshadow::kUint32:                            \

    LOG(FATAL) << "This operation only support "    \

                  "floating point types not uint32";\

    break;                                          \

  case mshadow::kUint64:                            \

    LOG(FATAL) << "This operation only support "    \

                  "floating point types not uint64";\

    break;                                          \

  default:                                          \

    LOG(FATAL) << "Unknown type enum " << type$;    \

  }

#else

/*!
 * \brief Floating-point type dispatch that declares two typedefs per case.
 *
 * This definition is the one selected when __NVCC__ is defined. It expands
 * to a bare `switch` statement; for each supported enumerator the variadic
 * body is emitted in a scope with these typedefs:
 *   - mshadow::kFloat32 : DType$ = float,                 DLargeType$ = float
 *   - mshadow::kFloat64 : DType$ = double,                DLargeType$ = double
 *   - mshadow::kFloat16 : DType$ = mshadow::half::half_t, DLargeType$ = float
 * This variant has no case for mshadow::kBfloat16, so that value falls
 * through to the default branch and is reported as an unknown enum. The
 * integer and bool enumerators each have a case that only reports a
 * type-specific message through LOG(FATAL).
 *
 * \param type$       expression yielding the type enum; it appears both as
 *                    the switch operand and in the default-branch message
 * \param DType$      identifier to declare as the element typedef
 * \param DLargeType$ identifier to declare as the second typedef
 * \param ...         statements to instantiate once per supported type
 */
#define MSHADOW_REAL_TYPE_SWITCH_EX(type$, DType$, DLargeType$, ...)  \

  switch (type$) {                                  \

  case mshadow::kFloat32:                           \

    {                                               \

      typedef float DType$;                         \

      typedef float DLargeType$;                    \

      {__VA_ARGS__}                                 \

    }                                               \

    break;                                          \

  case mshadow::kFloat64:                           \

    {                                               \

      typedef double DType$;                        \

      typedef double DLargeType$;                   \

      {__VA_ARGS__}                                 \

    }                                               \

    break;                                          \

  case mshadow::kFloat16:                           \

    {                                               \

      typedef mshadow::half::half_t DType$;         \

      typedef float DLargeType$;                    \

      {__VA_ARGS__}                                 \

    }                                               \

    break;                                          \

  case mshadow::kUint8:                             \

    LOG(FATAL) << "This operation only support "    \

                  "floating point types not uint8"; \

    break;                                          \

  case mshadow::kInt8:                              \

    LOG(FATAL) << "This operation only support "    \

                  "floating point types not int8";  \

    break;                                          \

  case mshadow::kInt32:                             \

    LOG(FATAL) << "This operation only support "    \

                  "floating point types, not int32";\

    break;                                          \

  case mshadow::kInt64:                             \

    LOG(FATAL) << "This operation only support "    \

                  "floating point types, not int64";\

    break;                                          \

  case mshadow::kBool:                              \

    LOG(FATAL) << "This operation only support "    \

                  "floating point types, not bool"; \

    break;                                          \

  case mshadow::kInt16:                             \

    LOG(FATAL) << "This operation only support "    \

                  "floating point types, not int16";\

    break;                                          \

  case mshadow::kUint16:                            \

    LOG(FATAL) << "This operation only support "    \

                  "floating point types not uint16";\

    break;                                          \

  case mshadow::kUint32:                            \

    LOG(FATAL) << "This operation only support "    \

                  "floating point types not uint32";\

    break;                                          \

  case mshadow::kUint64:                            \

    LOG(FATAL) << "This operation only support "    \

                  "floating point types not uint64";\

    break;                                          \

  default:                                          \

    LOG(FATAL) << "Unknown type enum " << type$;    \

  }

#endif

/*!
 * \brief Dispatch on a runtime layout enum and expose it as a constant.
 *
 * Expands to a bare `switch` statement over `layout`. For each of
 * mshadow::kNCHW, kNHWC, kNCDHW and kNDHWC the variadic body is emitted in
 * a scope where `Layout` is a `const int` holding that enumerator. The
 * enumerators carry the mshadow:: qualifier on both the case labels and the
 * initializers, so the expansion does not depend on the call site being
 * inside namespace mshadow. Any other value reaches the default branch and
 * is reported through LOG(FATAL).
 *
 * \param layout expression yielding the layout enum; it appears both as the
 *               switch operand and in the default-branch message
 * \param Layout identifier to declare as the per-case `const int`
 * \param ...    statements to instantiate once per supported layout
 */
#define MSHADOW_LAYOUT_SWITCH(layout, Layout, ...)  \
  switch (layout) {                                 \
  case mshadow::kNCHW:                              \
    {                                               \
      const int Layout = mshadow::kNCHW;            \
      {__VA_ARGS__}                                 \
    }                                               \
    break;                                          \
  case mshadow::kNHWC:                              \
    {                                               \
      const int Layout = mshadow::kNHWC;            \
      {__VA_ARGS__}                                 \
    }                                               \
    break;                                          \
  case mshadow::kNCDHW:                             \
    {                                               \
      const int Layout = mshadow::kNCDHW;           \
      {__VA_ARGS__}                                 \
    }                                               \
    break;                                          \
  case mshadow::kNDHWC:                             \
    {                                               \
      const int Layout = mshadow::kNDHWC;           \
      {__VA_ARGS__}                                 \
    }                                               \
    break;                                          \
  default:                                          \
    LOG(FATAL) << "Unknown layout enum " << layout; \
  }


/*!
 * \brief Dispatch on a runtime type enum for index types.
 *
 * Expands to a bare `switch` statement. The only enumerator with a case is
 * mshadow::kInt64, for which the variadic body is emitted in a scope where
 * `DType` is a typedef for int64_t. Every other value reaches the default
 * branch and is reported through LOG(FATAL) as an unknown enum.
 *
 * \param type  expression yielding the type enum; it appears both as the
 *              switch operand and in the default-branch message
 * \param DType identifier to declare as the index typedef
 * \param ...   statements to instantiate for the supported type
 */
#define MSHADOW_IDX_TYPE_SWITCH(type, DType, ...)   \

  switch (type) {                                   \

  case mshadow::kInt64:                             \

    {                                               \

      typedef int64_t DType;                        \

      {__VA_ARGS__}                                 \

    }                                               \

    break;                                          \

  default:                                          \

    LOG(FATAL) << "Unknown type enum " << type;     \

  }


/*!
 * \brief Dispatch on a runtime type enum, including bool.
 *
 * Expands to a bare `switch` statement. The variadic body is emitted, with
 * `DType` typedef'd to the matching C++ type, for kFloat32 (float),
 * kFloat64 (double), kFloat16 (mshadow::half::half_t), kBfloat16
 * (mshadow::bfloat::bf16_t), kUint8 (uint8_t), kInt8 (int8_t), kInt32
 * (int32_t), kInt64 (int64_t) and kBool (bool). The enumerators kInt16,
 * kUint16, kUint32 and kUint64 each have a case that only reports
 * "does not support" through LOG(FATAL). Any other value reaches the
 * default branch and is reported as an unknown enum.
 *
 * \param type  expression yielding the type enum; it appears both as the
 *              switch operand and in the default-branch message
 * \param DType identifier to declare as the element typedef
 * \param ...   statements to instantiate once per supported type
 */
#define MSHADOW_TYPE_SWITCH_WITH_BOOL(type, DType, ...)       \

  switch (type) {                                             \

  case mshadow::kFloat32:                                     \

    {                                                         \

      typedef float DType;                                    \

      {__VA_ARGS__}                                           \

    }                                                         \

    break;                                                    \

  case mshadow::kFloat64:                                     \

    {                                                         \

      typedef double DType;                                   \

      {__VA_ARGS__}                                           \

    }                                                         \

    break;                                                    \

  case mshadow::kFloat16:                                     \

    {                                                         \

      typedef mshadow::half::half_t DType;                    \

      {__VA_ARGS__}                                           \

    }                                                         \

    break;                                                    \

  case mshadow::kBfloat16:                                    \

    {                                                         \

      typedef mshadow::bfloat::bf16_t DType;                  \

      {__VA_ARGS__}                                           \

    }                                                         \

    break;                                                    \

  case mshadow::kUint8:                                       \

    {                                                         \

      typedef uint8_t DType;                                  \

      {__VA_ARGS__}                                           \

    }                                                         \

    break;                                                    \

  case mshadow::kInt8:                                        \

    {                                                         \

      typedef int8_t DType;                                   \

      {__VA_ARGS__}                                           \

    }                                                         \

    break;                                                    \

  case mshadow::kInt32:                                       \

    {                                                         \

      typedef int32_t DType;                                  \

      {__VA_ARGS__}                                           \

    }                                                         \

    break;                                                    \

  case mshadow::kInt64:                                       \

    {                                                         \

      typedef int64_t DType;                                  \

      {__VA_ARGS__}                                           \

    }                                                         \

    break;                                                    \

  case mshadow::kBool:                                        \

    {                                                         \

      typedef bool DType;                                     \

      {__VA_ARGS__}                                           \

    }                                                         \

    break;                                                    \

  case mshadow::kInt16:                                       \

    LOG(FATAL) << "This operation does not "                  \

                  "support int16 type";                       \

    break;                                                    \

  case mshadow::kUint16:                                      \

    LOG(FATAL) << "This operation does not "                  \

                  "support uint16 type";                      \

    break;                                                    \

  case mshadow::kUint32:                                      \

    LOG(FATAL) << "This operation does not "                  \

                  "support uint32 type";                      \

    break;                                                    \

  case mshadow::kUint64:                                      \

    LOG(FATAL) << "This operation does not "                  \

                  "support uint64 type";                      \

    break;                                                    \

  default:                                                    \

    LOG(FATAL) << "Unknown type enum " << type;               \

  }


/*!
 * \brief Dispatch on a runtime type enum over the extended numeric set.
 *
 * Expands to a bare `switch` statement. The variadic body is emitted, with
 * `DType` typedef'd to the matching C++ type, for kFloat32 (float),
 * kFloat64 (double), kFloat16 (mshadow::half::half_t), kBfloat16
 * (mshadow::bfloat::bf16_t), kUint8 (uint8_t), kInt8 (int8_t), kInt32
 * (int32_t), kInt64 (int64_t), kInt16 (int16_t), kUint16 (uint16_t),
 * kUint32 (uint32_t) and kUint64 (uint64_t). There is no case for
 * mshadow::kBool, so that value, like any other unlisted one, reaches the
 * default branch and is reported through LOG(FATAL) as an unknown enum.
 *
 * \param type  expression yielding the type enum; it appears both as the
 *              switch operand and in the default-branch message
 * \param DType identifier to declare as the element typedef
 * \param ...   statements to instantiate once per supported type
 */
#define MSHADOW_TYPE_SWITCH_EXT(type, DType, ...)             \

  switch (type) {                                             \

  case mshadow::kFloat32:                                     \

    {                                                         \

      typedef float DType;                                    \

      {__VA_ARGS__}                                           \

    }                                                         \

    break;                                                    \

  case mshadow::kFloat64:                                     \

    {                                                         \

      typedef double DType;                                   \

      {__VA_ARGS__}                                           \

    }                                                         \

    break;                                                    \

  case mshadow::kFloat16:                                     \

    {                                                         \

      typedef mshadow::half::half_t DType;                    \

      {__VA_ARGS__}                                           \

    }                                                         \

    break;                                                    \

  case mshadow::kBfloat16:                                    \

    {                                                         \

      typedef mshadow::bfloat::bf16_t DType;                  \

      {__VA_ARGS__}                                           \

    }                                                         \

    break;                                                    \

  case mshadow::kUint8:                                       \

    {                                                         \

      typedef uint8_t DType;                                  \

      {__VA_ARGS__}                                           \

    }                                                         \

    break;                                                    \

  case mshadow::kInt8:                                        \

    {                                                         \

      typedef int8_t DType;                                   \

      {__VA_ARGS__}                                           \

    }                                                         \

    break;                                                    \

  case mshadow::kInt32:                                       \

    {                                                         \

      typedef int32_t DType;                                  \

      {__VA_ARGS__}                                           \

    }                                                         \

    break;                                                    \

  case mshadow::kInt64:                                       \

    {                                                         \

      typedef int64_t DType;                                  \

      {__VA_ARGS__}                                           \

    }                                                         \

    break;                                                    \

  case mshadow::kInt16:                                       \

    {                                                         \

      typedef int16_t DType;                                  \

      {__VA_ARGS__}                                           \

    }                                                         \

    break;                                                    \

  case mshadow::kUint16:                                      \

    {                                                         \

      typedef uint16_t DType;                                 \

      {__VA_ARGS__}                                           \

    }                                                         \

    break;                                                    \

  case mshadow::kUint32:                                      \

    {                                                         \

      typedef uint32_t DType;                                 \

      {__VA_ARGS__}                                           \

    }                                                         \

    break;                                                    \

  case mshadow::kUint64:                                      \

    {                                                         \

      typedef uint64_t DType;                                 \

      {__VA_ARGS__}                                           \

    }                                                         \

    break;                                                    \

  default:                                                    \

    LOG(FATAL) << "Unknown type enum " << type;               \

  }


/*!
 * \brief Dispatch on a runtime type enum over the extended set plus bool.
 *
 * Expands to a bare `switch` statement. The variadic body is emitted, with
 * `DType` typedef'd to the matching C++ type, for kFloat32 (float),
 * kFloat64 (double), kFloat16 (mshadow::half::half_t), kBfloat16
 * (mshadow::bfloat::bf16_t), kUint8 (uint8_t), kInt8 (int8_t), kInt32
 * (int32_t), kInt64 (int64_t), kBool (bool), kInt16 (int16_t), kUint16
 * (uint16_t), kUint32 (uint32_t) and kUint64 (uint64_t). Any other value
 * reaches the default branch and is reported through LOG(FATAL) as an
 * unknown enum.
 *
 * \param type  expression yielding the type enum; it appears both as the
 *              switch operand and in the default-branch message
 * \param DType identifier to declare as the element typedef
 * \param ...   statements to instantiate once per supported type
 */
#define MSHADOW_TYPE_SWITCH_EXT_WITH_BOOL(type, DType, ...)   \

  switch (type) {                                             \

  case mshadow::kFloat32:                                     \

    {                                                         \

      typedef float DType;                                    \

      {__VA_ARGS__}                                           \

    }                                                         \

    break;                                                    \

  case mshadow::kFloat64:                                     \

    {                                                         \

      typedef double DType;                                   \

      {__VA_ARGS__}                                           \

    }                                                         \

    break;                                                    \

  case mshadow::kFloat16:                                     \

    {                                                         \

      typedef mshadow::half::half_t DType;                    \

      {__VA_ARGS__}                                           \

    }                                                         \

    break;                                                    \

  case mshadow::kBfloat16:                                    \

    {                                                         \

      typedef mshadow::bfloat::bf16_t DType;                  \

      {__VA_ARGS__}                                           \

    }                                                         \

    break;                                                    \

  case mshadow::kUint8:                                       \

    {                                                         \

      typedef uint8_t DType;                                  \

      {__VA_ARGS__}                                           \

    }                                                         \

    break;                                                    \

  case mshadow::kInt8:                                        \

    {                                                         \

      typedef int8_t DType;                                   \

      {__VA_ARGS__}                                           \

    }                                                         \

    break;                                                    \

  case mshadow::kInt32:                                       \

    {                                                         \

      typedef int32_t DType;                                  \

      {__VA_ARGS__}                                           \

    }                                                         \

    break;                                                    \

  case mshadow::kInt64:                                       \

    {                                                         \

      typedef int64_t DType;                                  \

      {__VA_ARGS__}                                           \

    }                                                         \

    break;                                                    \

  case mshadow::kBool:                                        \

    {                                                         \

      typedef bool DType;                                     \

      {__VA_ARGS__}                                           \

    }                                                         \

    break;                                                    \

  case mshadow::kInt16:                                       \

    {                                                         \

      typedef int16_t DType;                                  \

      {__VA_ARGS__}                                           \

    }                                                         \

    break;                                                    \

  case mshadow::kUint16:                                      \

    {                                                         \

      typedef uint16_t DType;                                 \

      {__VA_ARGS__}                                           \

    }                                                         \

    break;                                                    \

  case mshadow::kUint32:                                      \

    {                                                         \

      typedef uint32_t DType;                                 \

      {__VA_ARGS__}                                           \

    }                                                         \

    break;                                                    \

  case mshadow::kUint64:                                      \

    {                                                         \

      typedef uint64_t DType;                                 \

      {__VA_ARGS__}                                           \

    }                                                         \

    break;                                                    \

  default:                                                    \

    LOG(FATAL) << "Unknown type enum " << type;               \

  }


/*!
 * \brief get the size in bytes of the element type named by a type enum
 * \param type runtime type enum, dispatched through
 *             MSHADOW_TYPE_SWITCH_EXT_WITH_BOOL
 * \return sizeof() of the C++ type selected for `type`; the initial value 0
 *         is returned if the switch takes its default branch and
 *         LOG(FATAL) hands control back
 */
inline size_t mshadow_sizeof(int type) {
  // Keep the accumulator in size_t: sizeof() produces size_t and the
  // function returns size_t, so an int intermediate only adds two implicit
  // conversions (and the matching compiler warnings).
  size_t size = 0;
  MSHADOW_TYPE_SWITCH_EXT_WITH_BOOL(type, DType, size = sizeof(DType););
  return size;
}


/*!
 * \brief get string with the type name from type enum
 * \param dtype runtime type enum (one of the mshadow::k* values)
 * \return the type-name string for `dtype`; "unknown" if no case matches
 *         and LOG(FATAL) hands control back
 */
inline std::string dtype_string(const int dtype) {
  // Start from the fallback and overwrite it in the matching case, so the
  // function has a single exit.
  const char* type_name = "unknown";
  switch (dtype) {
    case mshadow::kFloat32: type_name = "float";              break;
    case mshadow::kFloat64: type_name = "double";             break;
    case mshadow::kFloat16: type_name = "half";               break;
    case mshadow::kUint8:   type_name = "unsigned char";      break;
    case mshadow::kInt8:    type_name = "char";               break;
    case mshadow::kInt32:   type_name = "int";                break;
    case mshadow::kInt64:   type_name = "long long";          break;
    case mshadow::kBool:    type_name = "bool";               break;
    case mshadow::kInt16:   type_name = "short";              break;
    case mshadow::kUint16:  type_name = "unsigned short";     break;
    case mshadow::kUint32:  type_name = "unsigned int";       break;
    case mshadow::kUint64:  type_name = "unsigned long long"; break;
    default:
      LOG(FATAL) << "Unknown type enum " << dtype;
      break;
  }
  return type_name;
}


}  // namespace mshadow

#endif  // MSHADOW_BASE_H_