docs/api/imperative_8h_source.html

 /*
  * Licensed to the Apache Software Foundation (ASF) under one
  * or more contributor license agreements.  See the NOTICE file
  * distributed with this work for additional information
  * regarding copyright ownership.  The ASF licenses this file
  * to you under the Apache License, Version 2.0 (the
  * "License"); you may not use this file except in compliance
  * with the License.  You may obtain a copy of the License at
  *
  *   http://www.apache.org/licenses/LICENSE-2.0
  *
  * Unless required by applicable law or agreed to in writing,
  * software distributed under the License is distributed on an
  * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
  * KIND, either express or implied.  See the License for the
  * specific language governing permissions and limitations
  * under the License.
  */

 #ifndef MXNET_IMPERATIVE_H_
 #define MXNET_IMPERATIVE_H_

 #include <mxnet/op_attr_types.h>
 #include <mxnet/graph_attr_types.h>
 #include <mxnet/c_api.h>
 #include <nnvm/symbolic.h>
 #include <nnvm/op.h>
 #include <nnvm/graph.h>
 #include <vector>
 #include <atomic>
 #include <utility>
 #include <string>
 #include <unordered_map>

 #include "./ndarray.h"

 namespace mxnet {
   /*!
    * \brief numpy shape compatibility flags.
    *  The numeric values are the ones exchanged as plain ints by
    *  Imperative::is_np_shape() and Imperative::set_is_np_shape():
    *  Off(0), ThreadLocalOn(1), GlobalOn(2).
    */
   enum NumpyShape {
     Off = 0,
     ThreadLocalOn = 1,
     GlobalOn = 2
   };
 class Imperative {
  public:
   class AGInfo {
    public:
     Context ctx;
     OpReqType grad_req;
     OpStatePtr state;
     std::vector<NDArray> outputs;
     std::vector<NDArray> out_grads;
     bool fresh_out_grad;

     AGInfo() :
       grad_req(kNullOp), fresh_out_grad(false) {}

     static void Clear(const nnvm::NodePtr& node) {
       if (node == nullptr || node->info.empty()) return;
       AGInfo& info = Get(node);
       if (info.grad_req != kNullOp) return;
       node->info.clear();
     }

     static AGInfo& Get(const nnvm::NodePtr& node) {
       return dmlc::get<AGInfo>(node->info);
     }

     static AGInfo& Create(const nnvm::NodePtr& node) {
       node->info.construct<AGInfo>();
       return Get(node);
     }

     static bool IsNone(const NDArray& arr) {
       return arr.entry_.node == nullptr || arr.entry_.node->info.empty();
     }

     static bool IsVariable(const nnvm::NodePtr& node) {
       AGInfo& info = Get(node);
       return info.grad_req != kNullOp && info.outputs.size() == 1
              && info.out_grads.size() == 1;
     }
   };
   bool is_training() const {
     return is_train_;
   }
   bool set_is_training(bool is_train) {
       bool old = is_train_;
       is_train_ = is_train;
       return old;
   }
   bool is_recording() const {
     return is_recording_;
   }
   bool set_is_recording(bool is_recording) {
       bool old = is_recording_;
       is_recording_ = is_recording;
       return old;
   }
   int is_np_shape() const {
     if (is_np_shape_global_) {
       return 2;
     }
     return is_np_shape_thread_local_ ? 1 : 0;
   }
   bool set_is_np_shape(int is_np_shape) {
     NumpyShape flag = static_cast<NumpyShape>(is_np_shape);
     bool old = this->is_np_shape();
     switch (flag) {
       case GlobalOn:
         is_np_shape_global_ = true;
         is_np_shape_thread_local_ = true;
         break;
       case ThreadLocalOn:
         is_np_shape_thread_local_ = true;
         break;
       case Off:
         is_np_shape_global_ = false;
         is_np_shape_thread_local_ = false;
         break;
     }
     return old;
   }
   void RecordOp(nnvm::NodeAttrs&& attrs,
                 const std::vector<NDArray*>& inputs,
                 const std::vector<NDArray*>& outputs,
                 const OpStatePtr& state = OpStatePtr(),
                 std::vector<bool>* p_save_inputs = nullptr,
                 std::vector<bool>* p_save_outputs = nullptr);
   OpStatePtr Invoke(const Context& default_ctx,
                     const nnvm::NodeAttrs& attrs,
                     const std::vector<NDArray*>& inputs,
                     const std::vector<NDArray*>& outputs);
   OpStatePtr InvokeOp(const Context& ctx,
                       const nnvm::NodeAttrs& attrs,
                       const std::vector<NDArray*>& inputs,
                       const std::vector<NDArray*>& outputs,
                       const std::vector<OpReqType>& req,
                       const DispatchMode dispatch_mode,
                       OpStatePtr state = OpStatePtr());
   void MarkVariables(const std::vector<NDArray*>& variables,
                      const std::vector<uint32_t>& grad_reqs,
                      const std::vector<NDArray*>& gradients);
   std::vector<NDArray*> Backward(const std::vector<NDArray*>& outputs,
                                  const std::vector<NDArray*>& ograds,
                                  const std::vector<NDArray*>& variables,
                                  bool is_train, bool retain_graph,
                                  bool create_graph);
   static Imperative* Get();
   static bool PreferBulkExecInference() {
     return dmlc::GetEnv("MXNET_EXEC_BULK_EXEC_INFERENCE", true);
   }
   static bool PreferBulkExecTrain() {
     return dmlc::GetEnv("MXNET_EXEC_BULK_EXEC_TRAIN", true);
   }
   static int BulkExecMaxNodeTrainFwd() {
     return dmlc::GetEnv("MXNET_EXEC_BULK_EXEC_MAX_NODE_TRAIN_FWD",
                         dmlc::GetEnv("MXNET_EXEC_BULK_EXEC_MAX_NODE_TRAIN", 15));
   }
   static int BulkExecMaxNodeTrainBwd() {
     return dmlc::GetEnv("MXNET_EXEC_BULK_EXEC_MAX_NODE_TRAIN_BWD",
                         dmlc::GetEnv("MXNET_EXEC_BULK_EXEC_MAX_NODE_TRAIN", 15));
   }

  private:
   friend class NDArray;
   Imperative() {
     if (PreferBulkExecTrain())
       backward_bulk_size_ = BulkExecMaxNodeTrainBwd();
   }
   void GetBackwardDependency(
       const nnvm::NodePtr& node,
       uint32_t num_inputs, uint32_t num_outputs,
       std::vector<bool> *p_save_inputs,
       std::vector<bool> *p_save_outputs);
 #if DMLC_CXX11_THREAD_LOCAL
   static thread_local bool is_train_;
   static thread_local bool is_recording_;
   // TOOD(junwu): Added numpy compatibility switch for backward compatibility.
   // Delete it in the next major release.
   static thread_local bool is_np_shape_thread_local_;
 #else
   static MX_THREAD_LOCAL bool is_train_;
   static MX_THREAD_LOCAL bool is_recording_;
   // TOOD(junwu): Added numpy compatibility switch for backward compatibility.
   // Delete it in the next major release.
   static MX_THREAD_LOCAL bool is_np_shape_thread_local_;
 #endif
   bool is_np_shape_global_{false};
   std::atomic<uint64_t> node_count_{0};
   std::atomic<uint64_t> variable_count_{0};
   int backward_bulk_size_{0};
 };

 }  // namespace mxnet
 #endif  // MXNET_IMPERATIVE_H_
mxnet::ThreadLocalOn
Definition: imperative.h:48

mxnet::Imperative::is_recording
bool is_recording() const
whether operator recording is on.
Definition: imperative.h:102

mxnet::Imperative::AGInfo::IsNone
static bool IsNone(const NDArray &arr)
Definition: imperative.h:81

mxnet::Imperative::BulkExecMaxNodeTrainFwd
static int BulkExecMaxNodeTrainFwd()
The max number of op nodes in a bulk during forward pass of training.
Definition: imperative.h:180

mxnet::Imperative::AGInfo::Create
static AGInfo & Create(const nnvm::NodePtr &node)
Definition: imperative.h:76

mxnet::Off
Definition: imperative.h:48

mxnet::Imperative::is_training
bool is_training() const
whether training mode is on.
Definition: imperative.h:92

mxnet::kNullOp
no operation, do not write anything
Definition: op_attr_types.h:47

mxnet::Imperative::set_is_training
bool set_is_training(bool is_train)
turn on or turn off training mode; returns the previous setting.
Definition: imperative.h:96

nnvm::NodeAttrs
The attributes of the current operation node. Usually are additional parameters like axis...
Definition: node.h:120

mxnet
namespace of mxnet
Definition: base.h:89

mxnet::Imperative::Backward
std::vector< NDArray * > Backward(const std::vector< NDArray * > &outputs, const std::vector< NDArray * > &ograds, const std::vector< NDArray * > &variables, bool is_train, bool retain_graph, bool create_graph)
compute the gradient of outputs w.r.t variables.

mxnet::Imperative::AGInfo::Clear
static void Clear(const nnvm::NodePtr &node)
Definition: imperative.h:65

mxnet::Imperative::Invoke
OpStatePtr Invoke(const Context &default_ctx, const nnvm::NodeAttrs &attrs, const std::vector< NDArray * > &inputs, const std::vector< NDArray * > &outputs)

nnvm::NodePtr
std::shared_ptr< Node > NodePtr
we always used NodePtr for a reference pointer to the node, so this alias can be changed in case...
Definition: node.h:49

mxnet::Imperative::AGInfo::AGInfo
AGInfo()
Definition: imperative.h:62

mxnet::DispatchMode
DispatchMode
the dispatch mode of the operator
Definition: op_attr_types.h:122

nnvm::NodeEntry::node
NodePtr node
the source node of this data
Definition: node.h:76

mxnet::Imperative::AGInfo::outputs
std::vector< NDArray > outputs
Definition: imperative.h:58

mxnet::Imperative::is_np_shape
int is_np_shape() const
return current numpy compatibility status, GlobalOn(2), ThreadLocalOn(1), Off(0). ...
Definition: imperative.h:114

mxnet::Imperative::AGInfo
Definition: imperative.h:53

mxnet::Imperative::set_is_recording
bool set_is_recording(bool is_recording)
turn on or turn off operator recording for autograd.
Definition: imperative.h:106

c_api.h

mxnet::Imperative::AGInfo::fresh_out_grad
bool fresh_out_grad
Definition: imperative.h:60

mxnet::Imperative::AGInfo::state
OpStatePtr state
Definition: imperative.h:57

mxnet::Imperative::AGInfo::out_grads
std::vector< NDArray > out_grads
Definition: imperative.h:59

mxnet::Imperative::RecordOp
void RecordOp(nnvm::NodeAttrs &&attrs, const std::vector< NDArray * > &inputs, const std::vector< NDArray * > &outputs, const OpStatePtr &state=OpStatePtr(), std::vector< bool > *p_save_inputs=nullptr, std::vector< bool > *p_save_outputs=nullptr)
record an operator (the function itself returns void).

mxnet::Imperative::AGInfo::grad_req
OpReqType grad_req
Definition: imperative.h:56

mxnet::Imperative::AGInfo::ctx
Context ctx
Definition: imperative.h:55

graph.h
Configuration of nnvm as well as basic data structure.

mxnet::OpReqType
OpReqType
operation request type to Forward and Backward
Definition: op_attr_types.h:45

mxnet::Imperative::InvokeOp
OpStatePtr InvokeOp(const Context &ctx, const nnvm::NodeAttrs &attrs, const std::vector< NDArray * > &inputs, const std::vector< NDArray * > &outputs, const std::vector< OpReqType > &req, const DispatchMode dispatch_mode, OpStatePtr state=OpStatePtr())

mxnet::Imperative::AGInfo::IsVariable
static bool IsVariable(const nnvm::NodePtr &node)
Definition: imperative.h:85

mxnet::Imperative
runtime functions for NDArray
Definition: imperative.h:50

mxnet::GlobalOn
Definition: imperative.h:48

mxnet::Imperative::AGInfo::Get
static AGInfo & Get(const nnvm::NodePtr &node)
Definition: imperative.h:72

op.h
Operator information structure.

graph_attr_types.h

mxnet::Imperative::PreferBulkExecTrain
static bool PreferBulkExecTrain()
Should op execution bulking be employed during training.
Definition: imperative.h:176

symbolic.h
Symbolic graph construction API.

mxnet::Imperative::BulkExecMaxNodeTrainBwd
static int BulkExecMaxNodeTrainBwd()
The max number of op nodes in a bulk during backward pass of training.
Definition: imperative.h:185

mxnet::Imperative::set_is_np_shape
bool set_is_np_shape(int is_np_shape)
specify numpy compatibility off, thread local on or global on.
Definition: imperative.h:121

mxnet::Imperative::PreferBulkExecInference
static bool PreferBulkExecInference()
Should op execution bulking be employed during inference.
Definition: imperative.h:172

mxnet::Imperative::MarkVariables
void MarkVariables(const std::vector< NDArray * > &variables, const std::vector< uint32_t > &grad_reqs, const std::vector< NDArray * > &gradients)
mark variables for computing gradients.

mxnet::Context
Context information about the execution environment.
Definition: base.h:102

ndarray.h

mxnet::NDArray
ndarray interface
Definition: ndarray.h:82

mxnet::NumpyShape
NumpyShape
There are three numpy shape flags, ordered by priority. GlobalOn turns on the numpy shape flag globally...
Definition: imperative.h:48

mxnet::OpStatePtr
Operator state. This is a pointer type, its content is mutable even if OpStatePtr is const...
Definition: op_attr_types.h:148

op_attr_types.h