executor.h
1 /*
2  * Licensed to the Apache Software Foundation (ASF) under one
3  * or more contributor license agreements. See the NOTICE file
4  * distributed with this work for additional information
5  * regarding copyright ownership. The ASF licenses this file
6  * to you under the Apache License, Version 2.0 (the
7  * "License"); you may not use this file except in compliance
8  * with the License. You may obtain a copy of the License at
9  *
10  * http://www.apache.org/licenses/LICENSE-2.0
11  *
12  * Unless required by applicable law or agreed to in writing,
13  * software distributed under the License is distributed on an
14  * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
15  * KIND, either express or implied. See the License for the
16  * specific language governing permissions and limitations
17  * under the License.
18  */
19 
26 #ifndef MXNET_CPP_EXECUTOR_H_
27 #define MXNET_CPP_EXECUTOR_H_
28 
29 #include <vector>
30 #include <map>
31 #include <set>
32 #include <string>
33 #include <algorithm>
34 #include "mxnet-cpp/base.h"
35 #include "mxnet-cpp/symbol.h"
36 
37 namespace mxnet {
38 namespace cpp {
39 
40 class Optimizer;
41 
45 class Executor {
46  public:
47  Executor(const Symbol& symbol,
48  Context context,
49  const std::vector<NDArray>& arg_arrays,
50  const std::vector<NDArray>& grad_arrays,
51  const std::vector<OpReqType>& grad_reqs,
52  const std::vector<NDArray>& aux_arrays,
53  const std::map<std::string, Context>& group_to_ctx = std::map<std::string, Context>(),
54  Executor* shared_exec = nullptr);
55  explicit Executor(const CachedOpHandle& h) {
56  handle_ = h;
57  }
62  void Forward(bool is_train) {
63  std::vector<NDArrayHandle> arg_handles;
64  for (const auto& array : combined_arrays) {
65  arg_handles.push_back(array.GetHandle());
66  }
67  int prev_is_record = 0;
68  int prev_train_mode = 0;
69  CHECK_EQ(MXAutogradSetIsRecording(1, &prev_is_record), 0);
70  if (is_train == true) {
71  CHECK_EQ(MXAutogradSetIsTraining(1, &prev_train_mode), 0);
72  }
73  std::vector<NDArrayHandle> output_handles;
74  std::transform(
75  outputs.begin(), outputs.end(), std::back_inserter(output_handles), [](NDArray& a) {
76  return a.GetHandle();
77  });
78  int out_size = 0;
79  NDArrayHandle* out_array = nullptr;
80  CHECK_EQ(MXInvokeCachedOp(handle_,
81  arg_handles.size(),
 82  arg_handles.data(),
 83  device_type,
84  device_id,
85  &out_size,
86  &out_array,
87  nullptr),
88  0);
89  outputs.clear();
90  outputs.reserve(out_size);
91  for (mx_uint i = 0; i < out_size; ++i) {
92  outputs.push_back(NDArray(out_array[i]));
93  }
94  int cur_train_mode = prev_train_mode;
95  int cur_is_record = prev_is_record;
96  if (is_train == true) {
97  CHECK_EQ(MXAutogradSetIsTraining(cur_train_mode, &prev_train_mode), 0);
98  }
99  CHECK_EQ(MXAutogradSetIsRecording(cur_is_record, &prev_is_record), 0);
100  }
111  void Backward(const std::vector<NDArray>& head_grads = std::vector<NDArray>()) {
112  if (require_grad == true) {
113  if (outputs.size() == 0) {
114  Forward(false);
115  }
116  std::vector<NDArrayHandle> out_handles;
117  for (const auto& array : outputs) {
118  out_handles.push_back(array.GetHandle());
119  }
120  std::vector<NDArrayHandle> head_grads_;
121  for (auto d : head_grads) {
122  head_grads_.push_back(d.GetHandle());
123  }
124  if (head_grads_.size() > 0) {
125  CHECK_EQ(MXAutogradBackwardEx(out_handles.size(),
126  out_handles.data(),
127  head_grads_.data(),
128  0,
129  nullptr,
130  0,
131  0,
132  1,
133  nullptr,
134  nullptr),
135  0);
136  } else {
137  CHECK_EQ(MXAutogradBackwardEx(out_handles.size(),
138  out_handles.data(),
139  nullptr,
140  0,
141  nullptr,
142  0,
143  0,
144  1,
145  nullptr,
146  nullptr),
147  0);
148  }
149  grad_arrays.clear();
150  grad_arrays.reserve(arg_arrays.size());
151  for (const auto& array : arg_arrays) {
152  NDArrayHandle grad;
153  CHECK_EQ(MXNDArrayGetGrad(array.GetHandle(), &grad), 0);
154  grad_arrays.push_back(NDArray(grad));
155  }
156  }
157  }
158  // TODO(zhangchen-qinyinghua)
159  // To implement reshape function
 160  void Reshape();
 164  ~Executor() {
165  MXFreeCachedOp(handle_);
166  }
167  std::vector<NDArray> arg_arrays;
168  std::vector<NDArray> grad_arrays;
169  std::vector<NDArray> aux_arrays;
 170  std::vector<NDArray> combined_arrays;
 171  int device_type;
 172  int device_id;
 173  bool require_grad;
177  std::vector<NDArray> outputs;
178  std::map<std::string, NDArray> arg_dict() {
179  return GetDict(symbol_.ListArguments(), arg_arrays);
180  }
181  std::map<std::string, NDArray> grad_dict() {
182  return GetDict(symbol_.ListArguments(), grad_arrays);
183  }
184  std::map<std::string, NDArray> aux_dict() {
185  return GetDict(symbol_.ListAuxiliaryStates(), aux_arrays);
186  }
187 
188  private:
189  Executor(const Executor& e);
190  Executor& operator=(const Executor& e);
191  CachedOpHandle handle_;
192  Symbol symbol_;
193  std::map<std::string, NDArray> GetDict(const std::vector<std::string>& names,
194  const std::vector<NDArray>& arrays) {
195  std::map<std::string, NDArray> ret;
196  std::set<std::string> name_set;
197  for (const auto& s : names) {
198  CHECK(name_set.find(s) == name_set.end()) << "Duplicate names detected, " << s;
199  name_set.insert(s);
200  }
201  CHECK_EQ(name_set.size(), arrays.size()) << "names size not equal to arrays size";
202  for (size_t i = 0; i < names.size(); ++i) {
203  ret[names[i]] = arrays[i];
204  }
205  return ret;
206  }
207 };
208 } // namespace cpp
209 } // namespace mxnet
210 #endif // MXNET_CPP_EXECUTOR_H_
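A minimal usage sketch of the class above, assuming the caller has already built the network Symbol and allocated argument, gradient and auxiliary NDArrays that match net.ListArguments() / net.ListAuxiliaryStates(). The umbrella header mxnet-cpp/MxNetCpp.h is used for brevity; TrainOneStep and all variable names are illustrative, not part of the library.

#include <map>
#include <string>
#include <vector>
#include "mxnet-cpp/MxNetCpp.h"

using namespace mxnet::cpp;

// Run one forward/backward pass through `net` with caller-supplied arrays.
void TrainOneStep(const Symbol& net,
                  const Context& ctx,
                  const std::vector<NDArray>& args,
                  const std::vector<NDArray>& grads,
                  const std::vector<OpReqType>& grad_reqs,
                  const std::vector<NDArray>& aux) {
  // Bind the symbol to concrete arrays; the Executor owns the cached-op
  // handle and frees it in its destructor.
  Executor exec(net, ctx, args, grads, grad_reqs, aux);

  exec.Forward(true);   // record the graph in training mode
  exec.Backward();      // gradients are fetched into exec.grad_arrays

  // Forward outputs and per-argument gradients are now available.
  const std::vector<NDArray>& outs = exec.outputs;
  std::map<std::string, NDArray> grads_by_name = exec.grad_dict();
  (void)outs;
  (void)grads_by_name;
}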
mxnet
namespace of mxnet
Definition: api_registry.h:33
MXAutogradSetIsTraining
MXNET_DLL int MXAutogradSetIsTraining(int is_training, int *prev)
set whether the autograd pass runs in training mode
CachedOpHandle
void * CachedOpHandle
handle to cached operator
Definition: c_api.h:80
mxnet::cpp::Executor::grad_dict
std::map< std::string, NDArray > grad_dict()
Definition: executor.h:181
mxnet::cpp::Executor::Backward
void Backward(const std::vector< NDArray > &head_grads=std::vector< NDArray >())
Perform a Backward operation of the Operator. This must be called after Forward. After this operation...
Definition: executor.h:111
mxnet::cpp::Executor::device_type
int device_type
Definition: executor.h:171
mxnet::cpp::Executor::outputs
std::vector< NDArray > outputs
arrays store the outputs of forward
Definition: executor.h:177
MXAutogradBackwardEx
MXNET_DLL int MXAutogradBackwardEx(uint32_t num_output, NDArrayHandle *output_handles, NDArrayHandle *ograd_handles, uint32_t num_variables, NDArrayHandle *var_handles, int retain_graph, int create_graph, int is_train, NDArrayHandle **grad_handles, int **grad_stypes)
compute the gradient of outputs w.r.t. variables
mxnet::cpp::Symbol::ListArguments
std::vector< std::string > ListArguments() const
List the argument names.
mxnet::cpp::Executor::~Executor
~Executor()
destructor, free the handle
Definition: executor.h:164
mxnet::cpp::Executor::aux_dict
std::map< std::string, NDArray > aux_dict()
Definition: executor.h:184
mxnet::cpp::Executor::Forward
void Forward(bool is_train)
Perform a Forward operation of the Operator. After this operation, user can get the result by using functi...
Definition: executor.h:62
mxnet::cpp::NDArray
NDArray interface.
Definition: ndarray.h:122
mxnet::cpp::Context
Context interface.
Definition: ndarray.h:45
mxnet::cpp::Symbol::ListAuxiliaryStates
std::vector< std::string > ListAuxiliaryStates() const
mxnet::cpp::Executor::grad_arrays
std::vector< NDArray > grad_arrays
Definition: executor.h:168
mxnet::cpp::Executor::Executor
Executor(const CachedOpHandle &h)
Definition: executor.h:55
mxnet::cpp::Executor::Reshape
void Reshape()
symbol.h
definition of symbol
MXFreeCachedOp
MXNET_DLL int MXFreeCachedOp(CachedOpHandle handle)
free cached operator
mxnet::cpp::Executor::combined_arrays
std::vector< NDArray > combined_arrays
Definition: executor.h:170
MXNDArrayGetGrad
MXNET_DLL int MXNDArrayGetGrad(NDArrayHandle handle, NDArrayHandle *out)
return gradient buffer attached to this NDArray
mxnet::NDArrayHandle
Definition: ndarray_handle.h:40
mxnet::cpp::Executor
Executor interface.
Definition: executor.h:45
mxnet::cpp::Executor::arg_dict
std::map< std::string, NDArray > arg_dict()
Definition: executor.h:178
MXInvokeCachedOp
MXNET_DLL int MXInvokeCachedOp(CachedOpHandle handle, int num_inputs, NDArrayHandle *inputs, int default_dev_type, int default_dev_id, int *num_outputs, NDArrayHandle **outputs, const int **out_stypes)
invoke a cached op
base.h
base definitions for mxnet-cpp
mxnet::cpp::Executor::arg_arrays
std::vector< NDArray > arg_arrays
Definition: executor.h:167
mxnet::cpp::Executor::device_id
int device_id
Definition: executor.h:172
MXAutogradSetIsRecording
MXNET_DLL int MXAutogradSetIsRecording(int is_recording, int *prev)
set whether to record operator for autograd
mx_uint
uint32_t mx_uint
manually define unsigned int
Definition: c_api.h:65
mxnet::cpp::Executor::require_grad
bool require_grad
Definition: executor.h:173
mxnet::cpp::Executor::aux_arrays
std::vector< NDArray > aux_arrays
Definition: executor.h:169
mxnet::cpp::Executor::Executor
Executor(const Symbol &symbol, Context context, const std::vector< NDArray > &arg_arrays, const std::vector< NDArray > &grad_arrays, const std::vector< OpReqType > &grad_reqs, const std::vector< NDArray > &aux_arrays, const std::map< std::string, Context > &group_to_ctx=std::map< std::string, Context >(), Executor *shared_exec=nullptr)
mxnet::cpp::Symbol
Symbol interface.
Definition: symbol.h:73
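The Forward() body above enables autograd recording (and, when is_train is true, training mode), invokes the cached op, and then restores the previous modes. The same save/restore sequence can be written as a small RAII guard; the sketch below is a hypothetical helper (AutogradModeGuard is not part of mxnet-cpp) built only on the C API calls listed above.

#include <dmlc/logging.h>
#include <mxnet/c_api.h>

// Hypothetical helper mirroring Executor::Forward: turn autograd recording
// (and optionally training mode) on for the lifetime of the guard, then
// restore whatever modes were active before.
class AutogradModeGuard {
 public:
  explicit AutogradModeGuard(bool is_train) : is_train_(is_train) {
    CHECK_EQ(MXAutogradSetIsRecording(1, &prev_is_record_), 0);
    if (is_train_) {
      CHECK_EQ(MXAutogradSetIsTraining(1, &prev_train_mode_), 0);
    }
  }
  ~AutogradModeGuard() {
    int ignored = 0;
    if (is_train_) {
      CHECK_EQ(MXAutogradSetIsTraining(prev_train_mode_, &ignored), 0);
    }
    CHECK_EQ(MXAutogradSetIsRecording(prev_is_record_, &ignored), 0);
  }

 private:
  bool is_train_;
  int prev_is_record_ = 0;
  int prev_train_mode_ = 0;
};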