1 /*
2  * Licensed to the Apache Software Foundation (ASF) under one
3  * or more contributor license agreements. See the NOTICE file
4  * distributed with this work for additional information
5  * regarding copyright ownership. The ASF licenses this file
6  * to you under the Apache License, Version 2.0 (the
7  * "License"); you may not use this file except in compliance
8  * with the License. You may obtain a copy of the License at
9  *
10  *   http://www.apache.org/licenses/LICENSE-2.0
11  *
12  * Unless required by applicable law or agreed to in writing,
13  * software distributed under the License is distributed on an
14  * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
15  * KIND, either express or implied. See the License for the
16  * specific language governing permissions and limitations
17  * under the License.
18  */
29 #include <mshadow/tensor.h>
30 #include <nnvm/op_attr_types.h>
32 #include <vector>
33 #include <functional>
35 #include "./base.h"
36 #include "./ndarray.h"
37 #include "./engine.h"
38 #include "./resource.h"
40 namespace mxnet {
42 using nnvm::NodeAttrs;
/*!
 * \brief Operation request type.
 *
 * Used in this file as the element type of the `req` argument
 * (`const std::vector<OpReqType>& req`) of the compute callback signatures.
 *
 * NOTE(review): no enumerators are visible in this declaration, so the
 * possible request values cannot be documented from here - confirm that the
 * enumerator list is present as intended.
 */
45 enum OpReqType {
58 };
/*!
 * \brief Context object handed to the compute callbacks declared in this file
 *  (they all take a `const OpContext& ctx`).
 */
66 struct OpContext {
    /*! \brief presumably whether gradients will be needed for this call - TODO confirm */
68  bool need_grad;
    /*! \brief presumably whether the call happens during training - TODO confirm */
70  bool is_train;
    /*! \brief resources available to the operator; presumably the ones it requested - TODO confirm */
76  std::vector<Resource> requested;
    /*!
     * \brief Get the mshadow stream for the given device type.
     * \tparam xpu device type tag, forwarded to run_ctx.get_stream<xpu>()
     * \return the stream pointer returned by run_ctx.get_stream<xpu>()
     *
     * NOTE(review): `run_ctx` is not declared among the members visible in
     * this struct - confirm where it is declared.
     */
82  template<typename xpu>
83  inline mshadow::Stream<xpu>* get_stream() const {
84  return run_ctx.get_stream<xpu>();
85  }
86 };
/*!
 * \brief Execution type of an operator; this is the value returned by an
 *  FExecType callable.
 */
89 enum class ExecType {
    /*! \brief presumably: the call is synchronous, i.e. work is done when it returns - TODO confirm */
91  kSync,
    /*! \brief presumably: the call is asynchronous and completion is signalled separately - TODO confirm */
96  kAsync,
109 };
/*!
 * \brief Dispatch mode of an operator: selects which kind of compute callback
 *  is used. It is passed to FResourceRequestEx and written through a pointer
 *  by FInferStorageType.
 */
112 enum class DispatchMode {
    // no dispatch mode decided yet (the only enumerator with an explicit value, -1)
113  kUndefined = -1,
114  // dispatch on FCompute or FStatefulCompute
115  kFCompute,
116  // dispatch on FComputeEx or FStatefulComputeEx, if available
117  kFComputeEx,
118  // dispatch on FCompute or FStatefulCompute, and performs storage fallback
    // NOTE(review): the comment above describes a storage-fallback mode, but no
    // enumerator follows it here - confirm whether an enumerator is missing.
120  // special dispatch mode for variables
121  kVariable,
122 };
128 class OpStatePtr {
129  public:
130  /* \brief Create a OpStatePtr with state of type T.
131  * \param args Arguments passed to T's constructor.
132  */
133  template<typename T, typename... Args>
134  static OpStatePtr Create(Args&&... args) {
135  OpStatePtr ret;
136  auto state = new T(std::forward<Args>(args)...);
137  auto var = Engine::Get()->NewVariable();
138  ret.ptr_.reset(
139  new OpState(var, state),
140  [](OpState* p) {
141  Engine::Get()->DeleteVariable([](RunContext s) {}, Context::CPU(), p->var);
142  delete reinterpret_cast<T*>(p->state);
143  delete p;
144  });
146  return ret;
147  }
148  /* \brief Get engine variable associated with this state */
150  return ptr_->var;
151  }
152  /* \brief Get state of type T */
153  template<typename T>
154  T& get_state() const {
155  return *reinterpret_cast<T*>(ptr_->state);
156  }
157  /* \brief clear state */
158  void reset() {
159  ptr_.reset();
160  }
161  /* \brief checks whether the managed object is managed only by the current
162  OpStatePtr instance */
163  bool unique() const {
164  return ptr_.unique();
165  }
166  /* \brief Whether state is empty */
167  explicit operator bool() const {
168  return ptr_ ? true : false;
169  }
171  private:
172  /* \brief state structure */
173  struct OpState {
174  engine::VarHandle var;
175  void* state;
177  OpState(engine::VarHandle var_, void* state_) : var(var_), state(state_) {}
178  OpState(const OpState& other) = delete;
179  OpState& operator=(const OpState& other) = delete;
180  };
181  /* \brief shared pointer to state */
182  std::shared_ptr<OpState> ptr_;
183 };
/*!
 * \brief Signature of a callable that creates an operator state.
 *
 * \param attrs    attributes of the node
 * \param ctx      context passed to the creator; presumably the device the
 *                 state is created for - TODO confirm
 * \param in_shape list of shapes; presumably one per operator input - TODO confirm
 * \param in_type  list of integer type codes; presumably one per operator
 *                 input - TODO confirm
 * \return the created state, wrapped in an OpStatePtr
 */
197 using FCreateOpState = std::function<OpStatePtr (const NodeAttrs& attrs,
198  Context ctx,
199  const std::vector<TShape>& in_shape,
200  const std::vector<int>& in_type)>;
/*!
 * \brief Signature of a callable that reports the execution type of an operator.
 *
 * \param attrs attributes of the node
 * \return the ExecType to use for that node
 */
204 using FExecType = std::function<ExecType (const NodeAttrs& attrs)>;
/*!
 * \brief Signature of a compute callable for operators that carry a state,
 *  working on TBlob inputs and outputs.
 *
 * \param state   the operator state
 * \param ctx     operator context
 * \param inputs  input blobs
 * \param req     request types; presumably one per output - TODO confirm
 * \param outputs output blobs
 */
212 using FStatefulCompute = std::function<void (const OpStatePtr& state,
213  const OpContext& ctx,
214  const std::vector<TBlob>& inputs,
215  const std::vector<OpReqType>& req,
216  const std::vector<TBlob>& outputs)>;
/*!
 * \brief Signature of a compute callable for operators that carry a state,
 *  working on NDArray inputs and outputs (the NDArray counterpart of
 *  FStatefulCompute).
 *
 * \param state   the operator state
 * \param ctx     operator context
 * \param inputs  input arrays
 * \param req     request types; presumably one per output - TODO confirm
 * \param outputs output arrays
 */
224 using FStatefulComputeEx = std::function<void (const OpStatePtr& state,
225  const OpContext& ctx,
226  const std::vector<NDArray>& inputs,
227  const std::vector<OpReqType>& req,
228  const std::vector<NDArray>& outputs)>;
/*!
 * \brief Signature of a callable that lists the resources an operator asks for.
 *
 * \param n attributes of the node
 * \return the list of ResourceRequest for that node
 */
235 using FResourceRequest = std::function<
236  std::vector<ResourceRequest> (const NodeAttrs& n)>;
/*!
 * \brief Signature of a callable that lists the resources an operator asks
 *  for, additionally taking the device mask and the dispatch mode into account.
 *
 * \param n             attributes of the node
 * \param dev_mask      device mask; presumably identifies the device type the
 *                      operator runs on - TODO confirm
 * \param dispatch_mode dispatch mode of the operator
 * \return the list of ResourceRequest for that node
 */
243 using FResourceRequestEx = std::function<
244  std::vector<ResourceRequest> (const NodeAttrs& n,
245  const int dev_mask,
246  const DispatchMode dispatch_mode)>;
/*!
 * \brief Signature of a callable that operates directly on NDArrays.
 *
 * \param attrs   attributes of the node
 * \param inputs  input arrays
 * \param outputs pointer to the vector of output arrays; passed by pointer,
 *                so presumably the callee may fill or modify it - TODO confirm
 */
252 using FNDArrayFunction = std::function<void (const nnvm::NodeAttrs& attrs,
253  const std::vector<NDArray>& inputs,
254  std::vector<NDArray>* outputs)>;
/*!
 * \brief Signature of a stateless compute callable working on TBlob inputs
 *  and outputs.
 *
 * \param attrs   attributes of the node
 * \param ctx     operator context
 * \param inputs  input blobs
 * \param req     request types; presumably one per output - TODO confirm
 * \param outputs output blobs
 */
260 using FCompute = std::function<void (const nnvm::NodeAttrs& attrs,
261  const OpContext& ctx,
262  const std::vector<TBlob>& inputs,
263  const std::vector<OpReqType>& req,
264  const std::vector<TBlob>& outputs)>;
/*!
 * \brief Signature of a stateless compute callable working on NDArray inputs
 *  and outputs (the NDArray counterpart of FCompute).
 *
 * \param attrs   attributes of the node
 * \param ctx     operator context
 * \param inputs  input arrays
 * \param req     request types; presumably one per output - TODO confirm
 * \param outputs output arrays
 */
270 using FComputeEx = std::function<void (const nnvm::NodeAttrs& attrs,
271  const OpContext& ctx,
272  const std::vector<NDArray>& inputs,
273  const std::vector<OpReqType>& req,
274  const std::vector<NDArray>& outputs)>;
/*!
 * \brief Signature of a callable that infers storage types and selects the
 *  dispatch mode of an operator.
 *
 * \param attrs         attributes of the node
 * \param dev_mask      device mask; presumably identifies the device type the
 *                      operator runs on - TODO confirm
 * \param dispatch_mode pointer to the dispatch mode; passed by pointer, so
 *                      presumably written by the callee - TODO confirm
 * \param in_attrs      pointer to integer storage attributes of the inputs;
 *                      presumably read and updated in place - TODO confirm
 * \param out_attrs     pointer to integer storage attributes of the outputs;
 *                      presumably read and updated in place - TODO confirm
 * \return bool; presumably true when inference succeeded - TODO confirm
 */
282 using FInferStorageType = std::function<bool (const NodeAttrs& attrs,
283  const int dev_mask,
284  DispatchMode* dispatch_mode,
285  std::vector<int>* in_attrs,
286  std::vector<int>* out_attrs)>;
/*!
 * \brief Signature of a callable that produces a graph node from the
 *  attributes of an existing node.
 *
 * \param attrs attributes of the node
 * \return an nnvm::NodePtr; presumably the quantized counterpart of the
 *         operator - TODO confirm
 */
292 using FQuantizedOp = std::function<nnvm::NodePtr (const NodeAttrs& attrs)>;
/*!
 * \brief Signature of a predicate evaluated on the attributes of a node.
 *
 * \param attrs attributes of the node
 * \return bool; presumably whether the operator's output needs to be
 *         requantized - TODO confirm
 */
300 using FNeedRequantize = std::function<bool (const NodeAttrs& attrs)>;
302 } // namespace mxnet
304 #endif // MXNET_OP_ATTR_TYPES_H_
