Skip to content

Commit abf4b77

Browse files
dsqx71 authored and piiswrong committed
[OP] add BilinearSamplingOp and GridGeneratorOp
fix inconsistency
1 parent e086a1f commit abf4b77

File tree

9 files changed

+1305
-0
lines changed

9 files changed

+1305
-0
lines changed

CONTRIBUTORS.md

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -120,3 +120,4 @@ List of Contributors
120120
* [Wei Wu](https://github.com/lazyparser)
121121
* [Shishi Duan](https://github.com/burness)
122122
* [Yu Du](https://github.com/Answeror)
123+
* [Xu Dong](https://github.com/dsqx71)

src/operator/bilinear_sampler-inl.h

Lines changed: 205 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,205 @@
1+
/*!
2+
* Copyright (c) 2017 by Contributors
3+
* \file bilinear_sampler-inl.h
4+
* \brief
5+
* \author Xu Dong
6+
*/
7+
#ifndef MXNET_OPERATOR_BILINEAR_SAMPLER_INL_H_
8+
#define MXNET_OPERATOR_BILINEAR_SAMPLER_INL_H_
9+
10+
#include <dmlc/logging.h>
11+
#include <dmlc/parameter.h>
12+
#include <mxnet/operator.h>
13+
#include <vector>
14+
#include <map>
15+
#include <string>
16+
#include <utility>
17+
#include "./operator_common.h"
18+
19+
namespace mxnet {
20+
namespace op {
21+
22+
namespace bs {
23+
enum BilinearSamplerOpInputs {kData, kGrid};
24+
enum BilinearSamplerOpOutputs {kOut, kTmp};
25+
}
26+
27+
// Parameter holder for BilinearSampler. The operator currently takes no
// tunable parameters; this struct exists so the op plugs into the standard
// dmlc::Parameter registration machinery (__DICT__/__FIELDS__ etc.).
struct BilinearSamplerParam : public dmlc::Parameter<BilinearSamplerParam> {
  DMLC_DECLARE_PARAMETER(BilinearSamplerParam) {
  }
};
31+
32+
template<typename xpu, typename DType>
33+
class BilinearSamplerOp : public Operator {
34+
public:
35+
explicit BilinearSamplerOp(BilinearSamplerParam p) {
36+
this->param_ = p;
37+
}
38+
39+
virtual void Forward(const OpContext &ctx,
40+
const std::vector<TBlob> &in_data,
41+
const std::vector<OpReqType> &req,
42+
const std::vector<TBlob> &out_data,
43+
const std::vector<TBlob> &aux_args) {
44+
using namespace mshadow;
45+
using namespace mshadow::expr;
46+
CHECK_EQ(in_data.size(), 2);
47+
Stream<xpu> *s = ctx.get_stream<xpu>();
48+
49+
Tensor<xpu, 4, DType> data = in_data[bs::kData].get<xpu, 4, DType>(s);
50+
Tensor<xpu, 4, DType> grid = in_data[bs::kGrid].get<xpu, 4, DType>(s);
51+
Tensor<xpu, 4, DType> out = out_data[bs::kOut].get<xpu, 4, DType>(s);
52+
53+
BilinearSamplerForward(out, data, grid);
54+
}
55+
56+
virtual void Backward(const OpContext &ctx,
57+
const std::vector<TBlob> &out_grad,
58+
const std::vector<TBlob> &in_data,
59+
const std::vector<TBlob> &out_data,
60+
const std::vector<OpReqType> &req,
61+
const std::vector<TBlob> &in_grad,
62+
const std::vector<TBlob> &aux_args) {
63+
using namespace mshadow;
64+
using namespace mshadow::expr;
65+
CHECK_EQ(in_data.size(), 2);
66+
Stream<xpu> *s = ctx.get_stream<xpu>();
67+
68+
Tensor<xpu, 4, DType> data = in_data[bs::kData].get<xpu, 4, DType>(s);
69+
Tensor<xpu, 4, DType> grid = in_data[bs::kGrid].get<xpu, 4, DType>(s);
70+
Tensor<xpu, 4, DType> gdata = in_grad[bs::kData].get<xpu, 4, DType>(s);
71+
Tensor<xpu, 4, DType> ggrid = in_grad[bs::kGrid].get<xpu, 4, DType>(s);
72+
Tensor<xpu, 4, DType> grad = out_grad[bs::kOut].get<xpu, 4, DType>(s);
73+
gdata = 0.0f;
74+
ggrid = 0.0f;
75+
BilinearSamplerBackward(gdata, ggrid, grad, data, grid);
76+
}
77+
78+
private:
79+
BilinearSamplerParam param_;
80+
}; // class BilinearSamplerOp
81+
82+
template<typename xpu>
83+
Operator* CreateOp(BilinearSamplerParam param, int dtype);
84+
85+
#if DMLC_USE_CXX11
86+
class BilinearSamplerProp : public OperatorProperty {
87+
public:
88+
int NumVisibleOutputs() const override {
89+
return 1;
90+
}
91+
92+
int NumOutputs() const override {
93+
return 2;
94+
}
95+
96+
std::vector<std::string> ListArguments() const override {
97+
return {"data", "grid"};
98+
}
99+
100+
std::vector<std::string> ListOutputs() const override {
101+
return {"output", "tmp"};
102+
}
103+
104+
void Init(const std::vector<std::pair<std::string, std::string> >& kwargs) override {
105+
param_.Init(kwargs);
106+
}
107+
108+
std::map<std::string, std::string> GetParams() const override {
109+
return param_.__DICT__();
110+
}
111+
112+
bool InferShape(std::vector<TShape> *in_shape,
113+
std::vector<TShape> *out_shape,
114+
std::vector<TShape> *aux_shape) const override {
115+
using namespace mshadow;
116+
CHECK_EQ(in_shape->size(), 2) << "Input:[data, grid]";
117+
const TShape &dshape = (*in_shape)[bs::kData];
118+
const TShape &lshape = (*in_shape)[bs::kGrid];
119+
if (dshape.ndim() == 0) return false;
120+
CHECK_EQ(dshape.ndim(), 4) \
121+
<< "input data should be 4D in batch-num_filter-y-x";
122+
if (lshape.ndim() == 0) return false;
123+
CHECK_EQ(lshape.ndim(), 4) \
124+
<< "Sampler grid should be 4D in batch-2-y-x";
125+
CHECK_EQ(dshape[0], lshape[0]);
126+
CHECK_EQ(lshape[1], 2) << "incorrect grid shape[1], should be 2";
127+
// target height
128+
CHECK_GT(lshape[2], 0) \
129+
<< "incorrect grid_shape: " << lshape[2];
130+
// target width
131+
CHECK_GT(lshape[3], 0) \
132+
<< "incorrect grid_shape: " << lshape[3];
133+
out_shape->clear();
134+
// output_shape : (data.shape[0], data.shape[1], grid.shape[2], grid.shape[3])
135+
out_shape->push_back(dshape);
136+
(*out_shape)[bs::kOut][2] = lshape[2];
137+
(*out_shape)[bs::kOut][3] = lshape[3];
138+
out_shape->push_back(Shape4(lshape[0], lshape[2], lshape[3], 2));
139+
return true;
140+
}
141+
142+
bool InferType(std::vector<int> *in_type,
143+
std::vector<int> *out_type,
144+
std::vector<int> *aux_type) const override {
145+
int dtype = -1;
146+
for (size_t i = 0; i < in_type->size(); ++i) {
147+
if (dtype == -1) {
148+
dtype = in_type->at(i);
149+
} else {
150+
CHECK(in_type->at(i) == dtype ||
151+
in_type->at(i) == -1) <<
152+
"Non-uniform data type in BilinearSampler";
153+
}
154+
}
155+
if (dtype == -1) {
156+
LOG(FATAL) << "Not enough information to infer type in BilinearSampler.";
157+
return false;
158+
}
159+
size_t nin = this->ListArguments().size();
160+
in_type->clear();
161+
for (size_t i = 0; i < nin; ++i) in_type->push_back(dtype);
162+
size_t naux = this->ListAuxiliaryStates().size();
163+
aux_type->clear();
164+
for (size_t i = 0; i < naux; ++i) aux_type->push_back(dtype);
165+
size_t nout = this->ListOutputs().size();
166+
out_type->clear();
167+
for (size_t i = 0; i < nout; ++i) out_type->push_back(dtype);
168+
return true;
169+
}
170+
171+
OperatorProperty* Copy() const override {
172+
auto ptr = new BilinearSamplerProp();
173+
ptr->param_ = param_;
174+
return ptr;
175+
}
176+
177+
std::string TypeString() const override {
178+
return "BilinearSampler";
179+
}
180+
181+
std::vector<int> DeclareBackwardDependency(
182+
const std::vector<int> &out_grad,
183+
const std::vector<int> &in_data,
184+
const std::vector<int> &out_data) const override {
185+
return {out_grad[bs::kOut],
186+
in_data[bs::kData],
187+
out_data[bs::kTmp],
188+
in_data[bs::kGrid]};
189+
}
190+
191+
Operator* CreateOperator(Context ctx) const override {
192+
LOG(FATAL) << "Not Implemented.";
193+
return NULL;
194+
}
195+
196+
Operator* CreateOperatorEx(Context ctx, std::vector<TShape> *in_shape,
197+
std::vector<int> *in_type) const override;
198+
199+
private:
200+
BilinearSamplerParam param_;
201+
}; // class BilinearSamplerProp
202+
#endif // DMLC_USE_CXX11
203+
} // namespace op
204+
} // namespace mxnet
205+
#endif // MXNET_OPERATOR_BILINEAR_SAMPLER_INL_H_

src/operator/bilinear_sampler.cc

Lines changed: 172 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,172 @@
1+
/*!
2+
* Copyright (c) 2017 by Contributors
3+
* \file bilinear_sampler.cc
4+
* \brief
5+
* \author Xu Dong
6+
*/
7+
8+
#include "./bilinear_sampler-inl.h"
9+
10+
namespace mshadow {
11+
// True iff `value` lies inside the closed interval [lowerBound, upperBound].
template<typename DType>
bool between(DType value, int lowerBound, int upperBound) {
  return !(value < lowerBound || value > upperBound);
}
15+
template<typename DType>
16+
inline void BilinearSamplerForward(const Tensor<cpu, 4, DType> &output,
17+
const Tensor<cpu, 4, DType> &input,
18+
const Tensor<cpu, 4, DType> &grid_src) {
19+
DType *out = output.dptr_;
20+
const DType *data = input.dptr_;
21+
const DType *grid = grid_src.dptr_;
22+
int o_n = output.size(0), o_c = output.size(1), o_h = output.size(2), o_w = output.size(3);
23+
int i_c = input.size(1), i_h = input.size(2), i_w = input.size(3);
24+
for (index_t n = 0; n < o_n; ++n) {
25+
for (index_t c = 0; c < o_c; ++c) {
26+
for (index_t h = 0; h < o_h; ++h) {
27+
for (index_t w = 0; w < o_w; ++w) {
28+
index_t out_index = n * o_c * o_h * o_w + c * o_h * o_w + h * o_w + w;
29+
index_t grid_index = n * o_h * o_w * 2 + h * o_w + w;
30+
DType y_real = (*(grid + grid_index + o_h * o_w) + 1) * (i_h - 1) / 2;
31+
DType x_real = (*(grid + grid_index) + 1) * (i_w - 1) / 2;
32+
index_t top_left_y = static_cast<int>(floor(y_real));
33+
index_t top_left_x = static_cast<int>(floor(x_real));
34+
DType top_left_y_w = 1.0 - (y_real - top_left_y);
35+
DType top_left_x_w = 1.0 - (x_real - top_left_x);
36+
index_t data_index = n * i_c * i_h * i_w + c * i_h * i_w +
37+
top_left_y * i_w + top_left_x;
38+
DType top_left_v = 0;
39+
DType top_right_v = 0;
40+
DType bottom_left_v = 0;
41+
DType bottom_right_v = 0;
42+
if (between(top_left_x, 0, i_w-1) && between(top_left_y, 0, i_h-1))
43+
top_left_v = *(data + data_index);
44+
if (between(top_left_x + 1, 0, i_w-1) && between(top_left_y, 0, i_h-1))
45+
top_right_v = *(data + data_index + 1);
46+
if (between(top_left_x, 0, i_w-1) && between(top_left_y + 1, 0, i_h-1))
47+
bottom_left_v = *(data + data_index + i_w);
48+
if (between(top_left_x+1, 0, i_w-1) && between(top_left_y + 1, 0, i_h-1))
49+
bottom_right_v = *(data + data_index + i_w + 1);
50+
*(out+out_index) = top_left_v * top_left_y_w * top_left_x_w +
51+
top_right_v * top_left_y_w * (1.0 - top_left_x_w) +
52+
bottom_left_v * (1.0 - top_left_y_w) * top_left_x_w +
53+
bottom_right_v * (1.0 - top_left_y_w) * (1.0 - top_left_x_w);
54+
}
55+
}
56+
}
57+
}
58+
}
59+
60+
template<typename DType>
61+
inline void BilinearSamplerBackward(const Tensor<cpu, 4, DType> &gdata,
62+
const Tensor<cpu, 4, DType> &ggrid,
63+
const Tensor<cpu, 4, DType> &output_grad,
64+
const Tensor<cpu, 4, DType> &input_data,
65+
const Tensor<cpu, 4, DType> &grid) {
66+
DType *g_input = gdata.dptr_;
67+
DType *grad_grid = ggrid.dptr_;
68+
const DType *grid_src = grid.dptr_;
69+
const DType *grad = output_grad.dptr_;
70+
const DType *data = input_data.dptr_;
71+
int o_n = output_grad.size(0), o_c = output_grad.size(1),
72+
o_h = output_grad.size(2), o_w = output_grad.size(3);
73+
int i_c = input_data.size(1), i_h = input_data.size(2), i_w = input_data.size(3);
74+
for (index_t n = 0; n < o_n; ++n) {
75+
for (index_t h = 0; h < o_h; ++h) {
76+
for (index_t w = 0; w < o_w; ++w) {
77+
DType top_left_y_gw = 0.0;
78+
DType top_left_x_gw = 0.0;
79+
index_t grid_src_index = n * o_h * o_w * 2 + h * o_w + w;
80+
DType y_real = (*(grid_src + grid_src_index + o_h * o_w) + 1) * (i_h - 1) / 2;
81+
DType x_real = (*(grid_src + grid_src_index) + 1) * (i_w - 1) / 2;
82+
index_t top_left_y = static_cast<int>(floor(y_real));
83+
index_t top_left_x = static_cast<int>(floor(x_real));
84+
DType top_left_y_w = 1.0 - (y_real - top_left_y);
85+
DType top_left_x_w = 1.0 - (x_real - top_left_x);
86+
for (index_t c = 0; c < o_c; ++c) {
87+
index_t grad_index = n * o_c * o_h * o_w + c * o_h * o_w + h * o_w + w;
88+
index_t data_index = n * i_c * i_h * i_w + c * i_h * i_w + top_left_y * i_w
89+
+ top_left_x;
90+
// calc 4 vertex value in input data
91+
DType top_left_v = 0;
92+
DType top_right_v = 0;
93+
DType bottom_left_v = 0;
94+
DType bottom_right_v = 0;
95+
// calc input grad
96+
if (between(top_left_x, 0, i_w-1) && between(top_left_y, 0, i_h-1)) {
97+
*(g_input + data_index) += *(grad + grad_index) * top_left_y_w * top_left_x_w;
98+
top_left_v = *(data + data_index);
99+
}
100+
if (between(top_left_x+1, 0, i_w-1) && between(top_left_y, 0, i_h-1)) {
101+
*(g_input + data_index + 1) += *(grad + grad_index) * top_left_y_w
102+
* (1.0 - top_left_x_w);
103+
top_right_v = *(data + data_index + 1);
104+
}
105+
if (between(top_left_x, 0, i_w-1) && between(top_left_y+1, 0, i_h-1)) {
106+
*(g_input + data_index+ i_w) += *(grad + grad_index) * (1.0 - top_left_y_w)
107+
* top_left_x_w;
108+
bottom_left_v = *(data + data_index + i_w);
109+
}
110+
if (between(top_left_x+1, 0, i_w-1) && between(top_left_y+1, 0, i_h-1)) {
111+
*(g_input + data_index+ i_w + 1) += *(grad + grad_index) * (1.0 - top_left_y_w)
112+
* (1.0 - top_left_x_w);
113+
bottom_right_v = *(data + data_index + i_w + 1);
114+
}
115+
// calc weight grad of top_left_w, then multiple -1 is the grad of grid_src
116+
top_left_y_gw -= *(grad + grad_index) * (top_right_v - bottom_right_v +
117+
(top_left_v - top_right_v - bottom_left_v + bottom_right_v)
118+
* top_left_x_w);
119+
top_left_x_gw -= *(grad + grad_index) * (bottom_left_v - bottom_right_v +
120+
(top_left_v - top_right_v - bottom_left_v + bottom_right_v)
121+
* top_left_y_w);
122+
}
123+
// calc grad of grid
124+
*(grad_grid + grid_src_index + o_h * o_w) = top_left_y_gw * (i_h - 1) / 2;
125+
*(grad_grid + grid_src_index) = top_left_x_gw * (i_w - 1) / 2;
126+
}
127+
}
128+
}
129+
}
130+
} // namespace mshadow
131+
132+
namespace mxnet {
133+
namespace op {
134+
template<>
135+
Operator* CreateOp<cpu>(BilinearSamplerParam param, int dtype) {
136+
Operator *op = NULL;
137+
MSHADOW_REAL_TYPE_SWITCH(dtype, DType, {
138+
op = new BilinearSamplerOp<cpu, DType>(param);
139+
})
140+
return op;
141+
}
142+
143+
// Validate shapes/types up front, then dispatch to the dtype-specialized
// CreateOp via DO_BIND_DISPATCH (which performs the return).
Operator *BilinearSamplerProp::CreateOperatorEx(Context ctx, std::vector<TShape> *in_shape,
                                                std::vector<int> *in_type) const {
  std::vector<int> out_type, aux_type;
  std::vector<TShape> out_shape, aux_shape;
  CHECK(InferType(in_type, &out_type, &aux_type));
  CHECK(InferShape(in_shape, &out_shape, &aux_shape));
  DO_BIND_DISPATCH(CreateOp, param_, (*in_type)[0]);
}
151+
152+
DMLC_REGISTER_PARAMETER(BilinearSamplerParam);

// Fixes vs. original description text: balanced the bracket in
// "data[batch, channel, y_src, x_src])", corrected "nomalized" ->
// "normalized", and added the missing space in "...input data, the results".
MXNET_REGISTER_OP_PROPERTY(BilinearSampler, BilinearSamplerProp)
.add_argument("data", "Symbol", "Input data to the BilinearsamplerOp.")
.add_argument("grid", "Symbol", "Input grid to the BilinearsamplerOp."
                                "grid has two channels: x_src, y_src")
.add_arguments(BilinearSamplerParam::__FIELDS__())
.describe("Apply bilinear sampling to input feature map.\n "
          "output[batch, channel, y_dst, x_dst] = G(data[batch, channel, y_src, x_src])\n "
          "x_dst, y_dst enumerate all spatial locations in output\n "
          "x_src = grid[batch, 0, y_dst, x_dst]\n "
          "y_src = grid[batch, 1, y_dst, x_dst]\n "
          "G() denotes the bilinear interpolation kernel\n"
          "If (x_src, y_src) is beyond the boundaries of input data, "
          "the results of forward and backward are zeros.\n"
          "The shape of output will be (data.shape[0], data.shape[1], grid.shape[2], grid.shape[3])\n"
          "The operator assumes that grid has been normalized. "
          "If you want to design a CustomOp to manipulate grid, "
          "please refer to GridGeneratorOp.");
171+
} // namespace op
172+
} // namespace mxnet

0 commit comments

Comments
 (0)