Source code for mxnet.util

# Licensed to the Apache Software Foundation (ASF) under one
# or more contributor license agreements.  See the NOTICE file
# distributed with this work for additional information
# regarding copyright ownership.  The ASF licenses this file
# to you under the Apache License, Version 2.0 (the
# "License"); you may not use this file except in compliance
# with the License.  You may obtain a copy of the License at
#
#   http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing,
# software distributed under the License is distributed on an
# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
# KIND, either express or implied.  See the License for the
# specific language governing permissions and limitations
# under the License.
"""general utility functions"""

import ctypes
import functools
import inspect
import threading
import tempfile
import platform
from contextlib import contextmanager

from struct import calcsize
from .base import (_LIB, check_call, c_str, py_str,
                   numeric_types, integer_types, long,
                   _MAX_VALUE_64_BIT_UNSIGNED_,
                   _MAX_VALUE_64_BIT_SIGNED_,
                   _MAX_VALUE_FLOAT32_REPRESENT_)


_np_ufunc_default_kwargs = {
    'where': True,
    'casting': 'same_kind',
    'order': 'K',
    'dtype': None,
    'subok': True,
}

_set_np_shape_logged = False
_set_np_array_logged = False
_set_np_default_dtype_logged = False


def get_gpu_count():
    size = ctypes.c_int()
    check_call(_LIB.MXGetGPUCount(ctypes.byref(size)))
    return size.value


def get_gpu_memory(gpu_dev_id):
    free_mem = ctypes.c_uint64(0)
    total_mem = ctypes.c_uint64(0)
    check_call(_LIB.MXGetGPUMemoryInformation64(gpu_dev_id, ctypes.byref(free_mem), ctypes.byref(total_mem)))
    return free_mem.value, total_mem.value


[docs]def set_np_shape(active): """Turns on/off NumPy shape semantics, in which `()` represents the shape of scalar tensors, and tuples with `0` elements, for example, `(0,)`, `(1, 0, 2)`, represent the shapes of zero-size tensors. This is turned off by default for keeping backward compatibility. Please note that this is designed as an infrastructure for the incoming MXNet-NumPy operators. Legacy operators registered in the modules `mx.nd` and `mx.sym` are not guaranteed to behave like their counterparts in NumPy within this semantics. Parameters ---------- active : bool Indicates whether to turn on/off NumPy shape semantics. Returns ------- A bool value indicating the previous state of NumPy shape semantics. Example ------- >>> import mxnet as mx >>> prev_state = mx.set_np_shape(True) >>> print(prev_state) False >>> print(mx.is_np_shape()) True """ global _set_np_shape_logged if active: if not _set_np_shape_logged: import logging logging.info('NumPy-shape semantics has been activated in your code. ' 'This is required for creating and manipulating scalar and zero-size ' 'tensors, which were not supported in MXNet before, as in the official ' 'NumPy library. Please DO NOT manually deactivate this semantics while ' 'using `mxnet.numpy` and `mxnet.numpy_extension` modules.') _set_np_shape_logged = True elif is_np_array(): raise ValueError('Deactivating NumPy shape semantics while NumPy array semantics is still' ' active is not allowed. Please consider calling `npx.reset_np()` to' ' deactivate both of them.') prev = ctypes.c_int() check_call(_LIB.MXSetIsNumpyShape(ctypes.c_int(active), ctypes.byref(prev))) return bool(prev.value)
[docs]def is_np_shape(): """Checks whether the NumPy shape semantics is currently turned on. In NumPy shape semantics, `()` represents the shape of scalar tensors, and tuples with `0` elements, for example, `(0,)`, `(1, 0, 2)`, represent the shapes of zero-size tensors. This is turned off by default for keeping backward compatibility. In the NumPy shape semantics, `-1` indicates an unknown size. For example, `(-1, 2, 2)` means that the size of the first dimension is unknown. Its size may be inferred during shape inference. Please note that this is designed as an infrastructure for the incoming MXNet-NumPy operators. Legacy operators registered in the modules `mx.nd` and `mx.sym` are not guaranteed to behave like their counterparts in NumPy within this semantics. Returns ------- A bool value indicating whether the NumPy shape semantics is currently on. Example ------- >>> import mxnet as mx >>> prev_state = mx.set_np_shape(True) >>> print(prev_state) False >>> print(mx.is_np_shape()) True """ curr = ctypes.c_bool() check_call(_LIB.MXIsNumpyShape(ctypes.byref(curr))) return curr.value
class _NumpyShapeScope(object): """Scope for managing NumPy shape semantics. In NumPy shape semantics, `()` represents the shape of scalar tensors, and tuples with `0` elements, for example, `(0,)`, `(1, 0, 2)`, represent the shapes of zero-size tensors. Do not use this class directly. Use `np_shape(active)` instead. Example:: with _NumpyShapeScope(True): y = model(x) backward([y]) """ def __init__(self, is_np_shape): #pylint: disable=redefined-outer-name self._enter_is_np_shape = is_np_shape self._prev_is_np_shape = None def __enter__(self): if self._enter_is_np_shape is not None: self._prev_is_np_shape = set_np_shape(self._enter_is_np_shape) def __exit__(self, ptype, value, trace): if self._enter_is_np_shape is not None and self._prev_is_np_shape != self._enter_is_np_shape: set_np_shape(self._prev_is_np_shape)
[docs]def np_shape(active=True): """Returns an activated/deactivated NumPy shape scope to be used in 'with' statement and captures code that needs the NumPy shape semantics, i.e. support of scalar and zero-size tensors. Please note that this is designed as an infrastructure for the incoming MXNet-NumPy operators. Legacy operators registered in the modules `mx.nd` and `mx.sym` are not guaranteed to behave like their counterparts in NumPy even within this scope. Parameters ---------- active : bool Indicates whether to activate NumPy-shape semantics. Returns ------- _NumpyShapeScope A scope object for wrapping the code w/ or w/o NumPy-shape semantics. Example:: with mx.np_shape(active=True): # A scalar tensor's shape is `()`, whose `ndim` is `0`. scalar = mx.nd.ones(shape=()) assert scalar.shape == () # If NumPy shape semantics is enabled, 0 in a shape means that # dimension contains zero elements. data = mx.sym.var("data", shape=(0, 2, 3)) ret = mx.sym.sin(data) arg_shapes, out_shapes, _ = ret.infer_shape() assert arg_shapes[0] == (0, 2, 3) assert out_shapes[0] == (0, 2, 3) # -1 means unknown shape dimension size in the new NumPy shape definition data = mx.sym.var("data", shape=(-1, 2, 3)) ret = mx.sym.sin(data) arg_shapes, out_shapes, _ = ret.infer_shape_partial() assert arg_shapes[0] == (-1, 2, 3) assert out_shapes[0] == (-1, 2, 3) # When a shape is completely unknown when NumPy shape semantics is on, it is # represented as `None` in Python. data = mx.sym.var("data") ret = mx.sym.sin(data) arg_shapes, out_shapes, _ = ret.infer_shape_partial() assert arg_shapes[0] is None assert out_shapes[0] is None with mx.np_shape(active=False): # 0 means unknown shape dimension size in the legacy shape definition. data = mx.sym.var("data", shape=(0, 2, 3)) ret = mx.sym.sin(data) arg_shapes, out_shapes, _ = ret.infer_shape_partial() assert arg_shapes[0] == (0, 2, 3) assert out_shapes[0] == (0, 2, 3) # When a shape is completely unknown in the legacy mode (default), its ndim is # equal to 0 and it is represented as `()` in Python. data = mx.sym.var("data") ret = mx.sym.sin(data) arg_shapes, out_shapes, _ = ret.infer_shape_partial() assert arg_shapes[0] == () assert out_shapes[0] == () """ return _NumpyShapeScope(active)
[docs]def use_np_shape(func): """A decorator wrapping a function or class with activated NumPy-shape semantics. When `func` is a function, this ensures that the execution of the function is scoped with NumPy shape semantics, such as the support for zero-dim and zero size tensors. When `func` is a class, it ensures that all the methods, static functions, and properties of the class are executed with the NumPy shape semantics. .. code-block:: python import mxnet as mx @mx.use_np_shape def scalar_one(): return mx.nd.ones(()) print(scalar_one()) @np.use_np_shape class ScalarTensor(object): def __init__(self, val=None): if val is None: val = ScalarTensor.random().value self._scalar = mx.nd.ones(()) * val def __repr__(self): print("Is __repr__ in np_shape semantics? {}!".format(str(np.is_np_shape()))) return str(self._scalar.asnumpy()) @staticmethod def random(): val = mx.nd.random.uniform().asnumpy().item() return ScalarTensor(val) @property def value(self): print("Is value property in np_shape semantics? {}!".format(str(np.is_np_shape()))) return self._scalar.asnumpy().item() print("Is global scope of np_shape activated? {}!".format(str(np.is_np_shape()))) scalar_tensor = ScalarTensor() print(scalar_tensor) Parameters ---------- func : a user-provided callable function or class to be scoped by the NumPy-shape semantics. Returns ------- Function or class A function or class wrapped in the NumPy-shape scope. """ if inspect.isclass(func): for name, method in inspect.getmembers( func, predicate= lambda f: inspect.isfunction(f) or inspect.ismethod(f) or isinstance(f, property)): if isinstance(method, property): setattr(func, name, property(use_np_shape(method.__get__), method.__set__, method.__delattr__, method.__doc__)) else: setattr(func, name, use_np_shape(method)) return func elif callable(func): @functools.wraps(func) def _with_np_shape(*args, **kwargs): with np_shape(active=True): return func(*args, **kwargs) return _with_np_shape else: raise TypeError('use_np_shape can only decorate classes and callable objects, ' 'while received a {}'.format(str(type(func))))
def _sanity_check_params(func_name, unsupported_params, param_dict): for param_name in unsupported_params: if param_name in param_dict: raise NotImplementedError("function {} does not support parameter {}" .format(func_name, param_name))
[docs]def set_module(module): """Decorator for overriding __module__ on a function or class. Example usage:: @set_module('mxnet.numpy') def example(): pass assert example.__module__ == 'numpy' """ def decorator(func): if module is not None: func.__module__ = module return func return decorator
class _NumpyArrayScope(object): """Scope for managing NumPy array creation. This is often used with `is_np_array=True` in initializer to enforce array creation as type `mxnet.numpy.ndarray`, instead of `mx.nd.NDArray` in Gluon. Do not use this class directly. Use `np_array(active)` instead. """ _current = threading.local() def __init__(self, is_np_array): # pylint: disable=redefined-outer-name self._old_scope = None self._is_np_array = is_np_array def __enter__(self): if not hasattr(_NumpyArrayScope._current, "value"): _NumpyArrayScope._current.value = _NumpyArrayScope(False) self._old_scope = _NumpyArrayScope._current.value _NumpyArrayScope._current.value = self return self def __exit__(self, ptype, value, trace): assert self._old_scope _NumpyArrayScope._current.value = self._old_scope
[docs]def np_array(active=True): """Returns an activated/deactivated NumPy-array scope to be used in 'with' statement and captures code that needs the NumPy-array semantics. Currently, this is used in Gluon to enforce array creation in `Block`s as type `mxnet.numpy.ndarray`, instead of `mx.nd.NDArray`. It is recommended to use the decorator `use_np_array` to decorate the classes that need this semantics, instead of using this function in a `with` statement unless you know exactly what has been scoped by this semantics. Please note that this is designed as an infrastructure for the incoming MXNet-NumPy operators. Legacy operators registered in the modules `mx.nd` and `mx.sym` are not guaranteed to behave like their counterparts in NumPy even within this scope. Parameters ---------- active : bool Indicates whether to activate NumPy-array semantics. Returns ------- _NumpyShapeScope A scope object for wrapping the code w/ or w/o NumPy-shape semantics. """ return _NumpyArrayScope(active)
[docs]def is_np_array(): """Checks whether the NumPy-array semantics is currently turned on. This is currently used in Gluon for checking whether an array of type `mxnet.numpy.ndarray` or `mx.nd.NDArray` should be created. For example, at the time when a parameter is created in a `Block`, an `mxnet.numpy.ndarray` is created if this returns true; else an `mx.nd.NDArray` is created. Normally, users are not recommended to use this API directly unless you known exactly what is going on under the hood. Please note that this is designed as an infrastructure for the incoming MXNet-NumPy operators. Legacy operators registered in the modules `mx.nd` and `mx.sym` are not guaranteed to behave like their counterparts in NumPy within this semantics. Returns ------- A bool value indicating whether the NumPy-array semantics is currently on. """ return _NumpyArrayScope._current.value._is_np_array if hasattr( _NumpyArrayScope._current, "value") else False
[docs]def use_np_array(func): """A decorator wrapping Gluon `Block`s and all its methods, properties, and static functions with the semantics of NumPy-array, which means that where ndarrays are created, `mxnet.numpy.ndarray`s should be created, instead of legacy ndarrays of type `mx.nd.NDArray`. For example, at the time when a parameter is created in a `Block`, an `mxnet.numpy.ndarray` is created if it's decorated with this decorator. .. code-block:: python import mxnet as mx from mxnet import gluon, nd, np from mxnet.gluon import Parameter class TestHybridBlock1(gluon.HybridBlock): def __init__(self): super(TestHybridBlock1, self).__init__() self.w = Parameter('w', shape=(2, 2)) def forward(self, x): return nd.dot(x, self.w.data()) x = mx.nd.ones((2, 2)) net1 = TestHybridBlock1() net1.initialize() out = net1.forward(x) for _, v in net1.collect_params().items(): assert type(v.data()) is mx.nd.NDArray assert type(out) is mx.nd.NDArray @mx.util.use_np_array class TestHybridBlock2(gluon.HybridBlock): def __init__(self): super(TestHybridBlock2, self).__init__() self.w = Parameter('w', shape=(2, 2)) def forward(self, x): return np.dot(x, self.w.data()) x = np.ones((2, 2)) net2 = TestHybridBlock2() net2.initialize() out = net2.forward(x) for _, v in net2.collect_params().items(): print(type(v.data())) assert type(v.data()) is np.ndarray assert type(out) is np.ndarray Parameters ---------- func : a user-provided callable function or class to be scoped by the NumPy-array semantics. Returns ------- Function or class A function or class wrapped in the NumPy-array scope. """ if inspect.isclass(func): for name, method in inspect.getmembers( func, predicate= lambda f: inspect.isfunction(f) or inspect.ismethod(f) or isinstance(f, property)): if isinstance(method, property): setattr(func, name, property(use_np_array(method.__get__), method.__set__, method.__delattr__, method.__doc__)) else: setattr(func, name, use_np_array(method)) return func elif callable(func): @functools.wraps(func) def _with_np_array(*args, **kwargs): with np_array(active=True): return func(*args, **kwargs) return _with_np_array else: raise TypeError('use_np_array can only decorate classes and callable objects, ' 'while received a {}'.format(str(type(func))))
[docs]def use_np(func): """A convenience decorator for wrapping user provided functions and classes in the scope of both NumPy-shape and NumPy-array semantics, which means that ``(1)`` empty tuples ``()`` and tuples with zeros, such as ``(0, 1)``, ``(1, 0, 2)``, will be treated as scalar tensors' shapes and zero-size tensors' shapes in shape inference functions of operators, instead of as unknown in legacy mode; (2) ndarrays of type :class:`mxnet.numpy.ndarray` should be created instead of :class:`mx.nd.NDArray`. .. code-block:: python import mxnet as mx from mxnet import gluon, nd, np from mxnet.gluon import Parameter class TestHybridBlock1(gluon.HybridBlock): def __init__(self): super(TestHybridBlock1, self).__init__() self.w = Parameter('w', shape=(2, 2)) def forward(self, x): return nd.dot(x, self.w.data()) + nd.ones((1,)) x = mx.nd.ones((2, 2)) net1 = TestHybridBlock1() net1.initialize() out = net1.forward(x) for _, v in net1.collect_params().items(): assert type(v.data()) is mx.nd.NDArray assert type(out) is mx.nd.NDArray @mx.util.use_np class TestHybridBlock2(gluon.HybridBlock): def __init__(self): super(TestHybridBlock2, self).__init__() self.w = Parameter('w', shape=(2, 2)) def forward(self, x): return np.dot(x, self.w.data()) + np.ones(()) x = np.ones((2, 2)) net2 = TestHybridBlock2() net2.initialize() out = net2.forward(x) for _, v in net2.collect_params().items(): print(type(v.data())) assert type(v.data()) is np.ndarray assert type(out) is np.ndarray Parameters ---------- func : a user-provided callable function or class to be scoped by the NumPy-shape and NumPy-array semantics. Returns ------- Function or class A function or class wrapped in the Numpy-shape and NumPy-array scope. """ return use_np_shape(use_np_array(func))
[docs]def wrap_np_unary_func(func): """A convenience decorator for wrapping numpy-compatible unary ufuncs to provide uniform error handling. Parameters ---------- func : a numpy-compatible unary function to be wrapped for better error handling. Returns ------- Function A function wrapped with proper error handling. """ @functools.wraps(func) def _wrap_np_unary_func(x, out=None, **kwargs): if len(kwargs) != 0: for key, value in kwargs.items(): # if argument is not in the set of ufunc arguments if key not in _np_ufunc_default_kwargs: raise TypeError("{} is an invalid keyword to function \'{}\'".format(key, func.__name__)) # if argument is one of the ufunc arguments, but not with the default value if value != _np_ufunc_default_kwargs[key]: # if the provided value of the argument is a legal option, raise NotImplementedError if np_ufunc_legal_option(key, value): raise NotImplementedError("{}={} is not implemented yet for operator {}" .format(key, str(value), func.__name__)) # otherwise raise TypeError with not understood error message raise TypeError("{}={} not understood for operator {}" .format(key, value, func.__name__)) return func(x, out=out) return _wrap_np_unary_func
[docs]def wrap_np_binary_func(func): """A convenience decorator for wrapping numpy-compatible binary ufuncs to provide uniform error handling. Parameters ---------- func : a numpy-compatible binary function to be wrapped for better error handling. Returns ------- Function A function wrapped with proper error handling. """ @functools.wraps(func) def _wrap_np_binary_func(x1, x2, out=None, **kwargs): if len(kwargs) != 0: for key, value in kwargs.items(): # if argument is not in the set of ufunc arguments if key not in _np_ufunc_default_kwargs: raise TypeError("{} is an invalid keyword to function \'{}\'".format(key, func.__name__)) # if argument is one of the ufunc arguments, but not with the default value if value != _np_ufunc_default_kwargs[key]: # if the provided value of the argument is a legal option, raise NotImplementedError if np_ufunc_legal_option(key, value): raise NotImplementedError("{}={} is not implemented yet".format(key, str(value))) # otherwise raise TypeError with not understood error message raise TypeError("{} {} not understood".format(key, value)) return func(x1, x2, out=out) return _wrap_np_binary_func
[docs]def wrap_data_api_statical_func(func): """ A convenience decorator for wrapping data apis standardized statical functions to provide context keyward backward compatibility Parameters ---------- func : a numpy-compatible array statical function to be wrapped for context keyward change. Returns ------- Function A function wrapped with context keyward changes. """ @functools.wraps(func) def _wrap_api_creation_func(*args, **kwargs): if len(kwargs) != 0: correction = kwargs.pop('ddof', None) if correction is not None: kwargs['correction'] = correction return func(*args, **kwargs) return _wrap_api_creation_func
[docs]def wrap_data_api_linalg_func(func): """ A convenience decorator for wrapping data apis standardized linalg functions to provide context keyward backward compatibility Parameters ---------- func : a numpy-compatible array linalg function to be wrapped for context keyward change. Returns ------- Function A function wrapped with context keyward changes. """ @functools.wraps(func) def _wrap_linalg_func(*args, **kwargs): if len(kwargs) != 0: upper = kwargs.pop('UPLO', None) rcond = kwargs.pop('rcond', None) tol = kwargs.pop('tol', None) if upper is not None: if upper == 'U': kwargs['upper'] = True else: kwargs['upper'] = False if rcond is not None: kwargs['rtol'] = rcond if tol is not None: kwargs['rtol'] = tol return func(*args, **kwargs) return _wrap_linalg_func
[docs]def wrap_sort_functions(func): """A convenience decorator for wrapping sort functions Parameters ---------- func : a numpy-compatible array creation function to be wrapped for parameter keyword change. Returns ------- Function A function wrapped with changed keywords. """ @functools.wraps(func) def _wrap_sort_func(*args, **kwargs): if len(kwargs) != 0: kind = kwargs.pop('kind', None) order = kwargs.pop('order', None) if kind is not None: kwargs['stable'] = kind == 'stable' if order is not None: raise NotImplementedError("order not supported here") return func(*args, **kwargs) return _wrap_sort_func
[docs]def wrap_ctx_to_device_func(func): """A convenience decorator for converting ctx to device keyward backward compatibility Parameters ---------- func : a function to be wrapped for context keyward change. Returns ------- Function A function wrapped with context keyward changes. """ @functools.wraps(func) def _wrap_func_with_ctx(*args, **kwargs): if len(kwargs) != 0: device = kwargs.pop('ctx', None) if device is not None: kwargs['device'] = device return func(*args, **kwargs) return _wrap_func_with_ctx
# pylint: disable=exec-used
[docs]def numpy_fallback(func): """decorator for falling back to offical numpy for a specific function""" def get_device(device, new_device): if device is None: return new_device else: if new_device is None: new_device = device assert device == new_device, f"inconsistent device {str(device)} and {str(new_device)}" return device def _as_official_np_array(object): device = None if hasattr(object, 'asnumpy'): return object.asnumpy(), object.device elif isinstance(object, (list, tuple)): tmp = [] for arr in object: new_arr, new_device = _as_official_np_array(arr) device = get_device(device, new_device) tmp.append(new_arr) return object.__class__(tmp), device elif isinstance(object, dict): tmp = {} for k, v in object.items(): new_v, new_device = _as_official_np_array(v) device = get_device(device, new_device) tmp[k] = new_v return tmp, device else: return object, None from .ndarray import from_numpy from .numpy import array from .device import current_device def _as_mx_np_array(object, device=current_device()): import numpy as _np if isinstance(object, _np.ndarray): try: ret = from_numpy(object).as_np_ndarray() except ValueError: ret = array(object, dtype=object.dtype, device=device) return (ret if ('cpu' in str(device)) else ret.to_device(device)) elif isinstance(object, (list, tuple)): tmp = [_as_mx_np_array(arr, device) for arr in object] return object.__class__(tmp) elif isinstance(object, dict): return {k:_as_mx_np_array(v, device) for k, v in object} else: return object import re func_name = func.__name__ func_doc = func.__doc__ func_source = inspect.getsource(func) func_source = re.sub(r'np\.', 'onp.', func_source) func_source = func_source.split('\n')[1:] indentation = func_source[0].find('def') if indentation == -1: raise ValueError("should wrap a function") stripped = [] for line in func_source: stripped.append(line[indentation:]) stripped.insert(1, ' import numpy as onp') func_source = '\n'.join(stripped) local = {} exec(func_source, None, local) func = local[func_name] func.__doc__ = func_doc @functools.wraps(func) def _fallback_to_official_np(*args, **kwargs): # for every ndarray input, fallback new_args, device0 = _as_official_np_array(args) new_kwargs, device1 = _as_official_np_array(kwargs) device = get_device(device0, device1) ret = func(*new_args, **new_kwargs) if ret is None: raise ValueError("Only functions with return values are allowed to use this decorator") ret = _as_mx_np_array(ret, device=device) return ret return _fallback_to_official_np
# pylint: enable=exec-used def _set_np_array(active): """Turns on/off NumPy array semantics for the current thread in which `mxnet.numpy.ndarray` is expected to be created, instead of the legacy `mx.nd.NDArray`. Parameters --------- active : bool A boolean value indicating whether the NumPy-array semantics should be turned on or off. Returns ------- A bool value indicating the previous state of NumPy array semantics. """ global _set_np_array_logged if active: if not _set_np_array_logged: import logging logging.info('NumPy array semantics has been activated in your code. This allows you' ' to use operators from MXNet NumPy and NumPy Extension modules as well' ' as MXNet NumPy `ndarray`s.') _set_np_array_logged = True cur_state = is_np_array() _NumpyArrayScope._current.value = _NumpyArrayScope(active) return cur_state
[docs]def set_np(shape=True, array=True, dtype=False): """Setting NumPy shape and array semantics at the same time. It is required to keep NumPy shape semantics active while activating NumPy array semantics. Deactivating NumPy shape semantics while NumPy array semantics is still active is not allowed. It is highly recommended to set these two flags to `True` at the same time to fully enable NumPy-like behaviors. Please refer to the Examples section for a better understanding. Parameters ---------- shape : bool A boolean value indicating whether the NumPy-shape semantics should be turned on or off. When this flag is set to `True`, zero-size and zero-dim shapes are all valid shapes in shape inference process, instead of treated as unknown shapes in legacy mode. array : bool A boolean value indicating whether the NumPy-array semantics should be turned on or off. When this flag is set to `True`, it enables Gluon code flow to use or generate `mxnet.numpy.ndarray`s instead of `mxnet.ndarray.NDArray`. For example, a `Block` would create parameters of type `mxnet.numpy.ndarray`. dtype : bool A boolean value indicating whether the NumPy-dtype semantics should be turned on or off. When this flag is set to `True`, default dtype is float64. When this flag is set to `False`, default dtype is float32. Examples -------- >>> import mxnet as mx Creating zero-dim ndarray in legacy mode would fail at shape inference. >>> mx.nd.ones(shape=()) mxnet.base.MXNetError: Operator _ones inferring shapes failed. >>> mx.nd.ones(shape=(2, 0, 3)) mxnet.base.MXNetError: Operator _ones inferring shapes failed. In legacy mode, Gluon layers would create parameters and outputs of type `mx.nd.NDArray`. >>> from mxnet.gluon import nn >>> dense = nn.Dense(2) >>> dense.initialize() >>> dense(mx.nd.ones(shape=(3, 2))) [[0.01983214 0.07832371] [0.01983214 0.07832371] [0.01983214 0.07832371]] <NDArray 3x2 @cpu(0)> >>> [p.data() for p in dense.collect_params().values()] [ [[0.0068339 0.01299825] [0.0301265 0.04819721]] <NDArray 2x2 @cpu(0)>, [0. 0.] <NDArray 2 @cpu(0)>] When the `shape` flag is `True`, both shape inferences are successful. >>> from mxnet import np, npx >>> npx.set_np() # this is required to activate NumPy-like behaviors >>> np.ones(shape=()) array(1.) >>> np.ones(shape=(2, 0, 3)) array([], shape=(2, 0, 3)) When the `array` flag is `True`, Gluon layers would create parameters and outputs of type `mx.np.ndarray`. >>> dense = nn.Dense(2) >>> dense.initialize() >>> dense(np.ones(shape=(3, 2))) array([[0.01983214, 0.07832371], [0.01983214, 0.07832371], [0.01983214, 0.07832371]]) >>> [p.data() for p in dense.collect_params().values()] [array([[0.0068339 , 0.01299825], [0.0301265 , 0.04819721]]), array([0., 0.])] >>> npx.set_np(dtype=True) >>> np.ones(shape=()).dtype dtype('float64') """ if not shape and array: raise ValueError('NumPy Shape semantics is required in using NumPy array semantics.') _set_np_array(array) set_np_shape(shape) set_np_default_dtype(dtype)
[docs]def reset_np(): """Deactivate NumPy shape and array and deafult dtype semantics at the same time.""" set_np(shape=False, array=False, dtype=False)
_CUDA_SUCCESS = 0
[docs]def get_cuda_compute_capability(device): """Returns the cuda compute capability of the input `device`. Parameters ---------- device : Device GPU context whose corresponding cuda compute capability is to be retrieved. Returns ------- cuda_compute_capability : int CUDA compute capability. For example, it returns 70 for CUDA arch equal to `sm_70`. References ---------- https://gist.github.com/f0k/63a664160d016a491b2cbea15913d549#file-cuda_check-py """ if device.device_type != 'gpu': raise ValueError('Expecting a gpu context to get cuda compute capability, ' 'while received device {}'.format(str(device))) libnames = ('libcuda.so', 'libcuda.dylib', 'nvcuda.dll', 'cuda.dll') for libname in libnames: try: cuda = ctypes.CDLL(libname) except OSError: continue else: break else: raise OSError("could not load any of: " + ' '.join(libnames)) # Some constants taken from cuda.h cc_major = ctypes.c_int() cc_minor = ctypes.c_int() cuda_device = ctypes.c_int() error_str = ctypes.c_char_p() ret = cuda.cuInit(0) if ret != _CUDA_SUCCESS: cuda.cuGetErrorString(ret, ctypes.byref(error_str)) raise RuntimeError('cuInit failed with erro code {}: {}' .format(ret, error_str.value.decode())) ret = cuda.cuDeviceGet(ctypes.byref(cuda_device), device.device_id) if ret != _CUDA_SUCCESS: cuda.cuGetErrorString(ret, ctypes.byref(error_str)) raise RuntimeError('cuDeviceGet failed with error code {}: {}' .format(ret, error_str.value.decode())) ret = cuda.cuDeviceComputeCapability(ctypes.byref(cc_major), ctypes.byref(cc_minor), cuda_device) if ret != _CUDA_SUCCESS: cuda.cuGetErrorString(ret, ctypes.byref(error_str)) raise RuntimeError('cuDeviceComputeCapability failed with error code {}: {}' .format(ret, error_str.value.decode())) return cc_major.value * 10 + cc_minor.value
[docs]def default_array(source_array, device=None, dtype=None): """Creates an array from any object exposing the default(nd or np) array interface. Parameters ---------- source_array : array_like An object exposing the array interface, an object whose `__array__` method returns an array, or any (nested) sequence. device : Device, optional Device context (default is the current default context). dtype : str or numpy.dtype, optional The data type of the output array. The default dtype is ``source_array.dtype`` if `source_array` is an `NDArray`, `float32` otherwise. Returns ------- NDArray An `NDArray`(nd or np) with the same contents as the `source_array`. """ from . import nd as _mx_nd from . import np as _mx_np if is_np_array(): return _mx_np.array(source_array, device=device, dtype=dtype) else: return _mx_nd.array(source_array, ctx=device, dtype=dtype)
class _NumpyDefaultDtypeScope(object): """Scope for managing NumPy default dtype semantics. In NumPy default dtype semantics, default dtype is 'float64', i.e. np.array([1, 2, 3]).dtype = np.float64 Original default dtype without this semantic is 'float32'. Do not use this class directly. Use `np_shape(active)` instead. Example:: with _NumpyDefaultDtypeScope(True): y = model(x) backward([y]) """ def __init__(self, is_np_default_dtype): #pylint: disable=redefined-outer-name self._enter_is_np_default_dtype = is_np_default_dtype self._prev_is_np_default_dtype = None def __enter__(self): if self._enter_is_np_default_dtype is not None: self._prev_is_np_default_dtype = set_np_default_dtype(self._enter_is_np_default_dtype) def __exit__(self, ptype, value, trace): if self._enter_is_np_default_dtype is not None and\ self._prev_is_np_default_dtype != self._enter_is_np_default_dtype: set_np_default_dtype(self._prev_is_np_default_dtype)
[docs]def np_default_dtype(active=True): """Returns an activated/deactivated NumPy-default_dtype scope to be used in 'with' statement and captures code that needs the NumPy default dtype semantics. i.e. default dtype is float64. Please note that this is designed as an infrastructure for the incoming MXNet-NumPy operators. Legacy operators registered in the modules `mx.nd` and `mx.sym` are not guaranteed to behave like their counterparts in NumPy even within this scope. Parameters ---------- active : bool Indicates whether to activate NumPy default dtype semantics. Returns ------- _NumpyDefaultDtypeScope A scope object for wrapping the code w/ or w/o NumPy-default_dtype semantics. Example:: with mx.np_default_dtype(active=True): # Default Dtype is 'float64', consistent with offical NumPy behavior. arr = mx.np.array([1, 2, 3]) assert arr.dtype == 'float64' with mx.np_default_dtype(active=False): # Default Dtype is 'float32' in the legacy default dtype definition. arr = mx.np.array([1, 2, 3]) assert arr.dtype == 'float32' """ return _NumpyDefaultDtypeScope(active)
[docs]def use_np_default_dtype(func): """A decorator wrapping a function or class with activated NumPy-default_dtype semantics. When `func` is a function, this ensures that the execution of the function is scoped with NumPy default dtype semantics, with the support for float64 as default dtype. When`func` is a class, it ensures that all the methods, static functions, and properties of the class are executed with the NumPy-default_dtype semantics. .. code-block:: python import mxnet as mx @mx.use_np_default_dtype def float64_one(): return mx.nd.ones(()).dtype print(float64_one()) @np.use_np_default_dtype class Float64Tensor(object): def __init__(self, data=None): if data is None: data = Float64Tensor.random().data self._data = data def __repr__(self): print("Is __repr__ in np_default_dtype semantics? {}!".format(str(np.is_np_deafult_dtype()))) return str(self._data.asnumpy()) @staticmethod def random(): data = mx.nd.random.uniform(shape=(2,2)) return ScalarTensor(data) @property def value(self): print("Is value property in np_dafault_dtype semantics? {}!".format(str(np.is_np_default_dtype()))) return self._data.asnumpy() print("Is global scope of np_default_dtype activated? {}!".format(str(np.is_np_default_dtype()))) float64_tensor = Float64Tensor() print(float64_tensor) Parameters ---------- func : a user-provided callable function or class to be scoped by the NumPy-default_dtype semantics. Returns ------- Function or class A function or class wrapped in the NumPy-default_dtype scope. """ if inspect.isclass(func): for name, method in inspect.getmembers( func, predicate= lambda f: inspect.isfunction(f) or inspect.ismethod(f) or isinstance(f, property)): if isinstance(method, property): setattr(func, name, property(use_np_default_dtype(method.__get__), method.__set__, method.__delattr__, method.__doc__)) else: setattr(func, name, use_np_default_dtype(method)) return func elif callable(func): @functools.wraps(func) def _with_np_default_dtype(*args, **kwargs): with np_default_dtype(active=True): return func(*args, **kwargs) return _with_np_default_dtype else: raise TypeError('use_np_default_dtype can only decorate classes and callable objects, ' 'while received a {}'.format(str(type(func))))
[docs]def is_np_default_dtype(): """Checks whether the NumPy default dtype semantics is currently turned on. In NumPy default dtype semantics, default dtype is float64. Please note that this is designed as an infrastructure for the incoming MXNet-NumPy operators. Legacy operators registered in the modules `mx.nd` and `mx.sym` are not guaranteed to behave like their counterparts in NumPy even within this scope. Returns ------- A bool value indicating whether the NumPy default dtype semantics is currently on. See Also -------- set_np_default_dtype : Set default dtype equals to offical numpy set_np : npx.set_np(dtype=True) has equal performance to npx.set_np_default_dtype(True) Example ------- >>> import mxnet as mx >>> from mxnet import npx >>> prev_state = npx.set_np_default_dtype(True) >>> print(prev_state) False >>> print(npx.is_np_default_dtype()) True """ curr = ctypes.c_bool() check_call(_LIB.MXIsNumpyDefaultDtype(ctypes.byref(curr))) return curr.value
[docs]def set_np_default_dtype(is_np_default_dtype=True): # pylint: disable=redefined-outer-name """Turns on/off NumPy default dtype semantics, because mxnet.numpy.ndarray use 32 bit data storage as default (e.g. float32 and int 32) while offical NumPy use 64 bit data storage as default (e.g. float64 and int64). This is turned off by default for keeping backward compatibility. Please note that this is designed as an infrastructure for the incoming MXNet-NumPy operators. Legacy operators registered in the modules `mx.nd` and `mx.sym` are not guaranteed to behave like their counterparts in NumPy within this semantics. Parameters ---------- active : bool Indicates whether to turn on/off NumPy default dtype semantics. Returns ------- A bool value indicating the previous state of NumPy default dtype semantics. Example ------- >>> import mxnet as mx >>> from mxnet import npx >>> prev_state = npx.set_np_default_dtype(True) >>> print(prev_state) False >>> print(npx.is_np_default_dtype()) True """ global _set_np_default_dtype_logged if is_np_default_dtype: if not _set_np_default_dtype_logged: import logging logging.info('NumPy array default dtype has been changed from flaot32 to float64 in your code.') _set_np_default_dtype_logged = True prev = ctypes.c_bool() check_call(_LIB.MXSetIsNumpyDefaultDtype(ctypes.c_bool(is_np_default_dtype), ctypes.byref(prev))) return prev.value
[docs]def getenv(name): """Get the setting of an environment variable from the C Runtime. Parameters ---------- name : string type The environment variable name Returns ------- value : string The value of the environment variable, or None if not set """ ret = ctypes.c_char_p() check_call(_LIB.MXGetEnv(c_str(name), ctypes.byref(ret))) return None if ret.value is None else py_str(ret.value)
[docs]def setenv(name, value): """Set an environment variable in the C Runtime. Parameters ---------- name : string type The environment variable name value : string type The desired value to set the environment value to """ passed_value = None if value is None else c_str(value) check_call(_LIB.MXSetEnv(c_str(name), passed_value))
[docs]def get_max_supported_compute_capability(): """Get the maximum compute capability (SM arch) supported by the nvrtc compiler """ max_supported_cc = ctypes.c_int() check_call(_LIB.MXGetMaxSupportedArch(ctypes.byref(max_supported_cc))) return max_supported_cc.value
[docs]def get_rtc_compile_opts(device): """Get the compile ops suitable for the context, given the toolkit/driver config """ device_cc = get_cuda_compute_capability(device) max_supported_cc = get_max_supported_compute_capability() # CUDA toolkits starting with 11.1 (first to support arch 86) can compile directly to SASS can_compile_to_SASS = max_supported_cc >= 86 should_compile_to_SASS = can_compile_to_SASS and \ device_cc <= max_supported_cc device_cc_as_used = min(device_cc, max_supported_cc) arch_opt = "--gpu-architecture={}_{}".format("sm" if should_compile_to_SASS else "compute", device_cc_as_used) return [arch_opt]
[docs]def set_flush_denorms(value): """Change floating-point calculations on CPU when dealing with denormalized values. This is only applicable to architectures which supports flush-to-zero. Denormalized values are positive and negative values that are very close to 0 (exponent is the smallest possible value). Flushing denormalized values to 0 can speedup calculations if such values occurs, but if fulfilling whole IEEE 754 standard is required this option should be disabled. Flushing denormalized values is enabled in MXNet by default. Parameters ---------- value : bool State of flush-to-zero and denormals-are-zero in MXCSR register Returns ------- prev_state : bool Previous state of flush-to-zero in MXCSR register """ ret = ctypes.c_bool() passed_value = ctypes.c_bool(value) check_call(_LIB.MXSetFlushDenorms(passed_value, ctypes.byref(ret))) return ret.value
[docs]def dtype_from_number(number): """Get the data type from the given int or float number """ assert isinstance(number, numeric_types),\ "The input number should be either int for float types" import numpy as _np if isinstance(number, (int, long)): if number > _MAX_VALUE_64_BIT_UNSIGNED_: raise OverflowError("Integer out of bounds") if number > _MAX_VALUE_64_BIT_SIGNED_: return _np.uint64 elif calcsize("P") == 8: return _np.int64 else: return _np.int32 elif isinstance(number, float): if abs(number) > _MAX_VALUE_FLOAT32_REPRESENT_ or \ ((not _np.isnan(number)) and \ (_np.float32(number) == int(number)) and \ (number != int(number))): return _np.float64 else: return _np.float64 if is_np_default_dtype() else _np.float32 elif isinstance(number, _np.generic): return number.dtype raise TypeError('type {} not supported'.format(str(type(number))))
# This is a wrapping of tempfile.TemporaryDirectory(), known to have cleanup issues on Windows. # The problem is partially handled as of Python 3.10 by the adding of a 'ignore_cleanup_errors' # parameter. Once MXNet's Python version is forced to be >= 3.10, a simplification of this # function to use 'ignore_cleanup_errors' would be possible. Until the fundamental Windows # issues are resolved, best to use this routine instead of tempfile.TemporaryDirectory().
[docs]@contextmanager def TemporaryDirectory(*args, **kwargs): """A context wrapper of tempfile.TemporaryDirectory() that ignores cleanup errors on Windows. """ dir = tempfile.TemporaryDirectory(*args, **kwargs) try: yield dir.name finally: try: dir.cleanup() except PermissionError: if platform.system() != 'Windows': raise