Merged
Changes from 6 commits
Commits (25)
299525d
use operator context
jacquesqiao Jul 23, 2017
11eabf8
optimize code
jacquesqiao Jul 24, 2017
4280a60
update net infershape
jacquesqiao Jul 24, 2017
dda4881
Merge branch 'develop' of https://github.com/PaddlePaddle/Paddle into…
jacquesqiao Jul 24, 2017
fb1b3d1
update InferShape
jacquesqiao Jul 24, 2017
081c7ca
disable override InferShape(scope) in OperatorBase
jacquesqiao Jul 24, 2017
5273c7e
Merge branch 'develop' of https://github.com/PaddlePaddle/Paddle into…
jacquesqiao Jul 25, 2017
0d693fe
change InferShapeImpl to InferShape
jacquesqiao Jul 25, 2017
bf3940b
add template to OperatorContext Input/Output
jacquesqiao Jul 26, 2017
362ba2f
merge Input InputVar, Output OutputVar
jacquesqiao Jul 26, 2017
a4bfb61
change Inputs to MultiInput
jacquesqiao Jul 26, 2017
217186e
Merge branch 'develop' of https://github.com/PaddlePaddle/Paddle into…
jacquesqiao Jul 27, 2017
1c91df3
fix conflict
jacquesqiao Jul 27, 2017
2460af4
fix MultiInput bugs and add unit test
jacquesqiao Jul 27, 2017
fb1980e
rename KernelContext to ExecutionContext
jacquesqiao Jul 27, 2017
9ff3595
clean code
jacquesqiao Jul 27, 2017
9fafc46
change InferShape to protected
jacquesqiao Jul 28, 2017
e87d253
Merge branch 'develop' of https://github.com/PaddlePaddle/Paddle into…
jacquesqiao Jul 30, 2017
9a2640b
fix template bug
jacquesqiao Jul 30, 2017
b6764c9
refine code
jacquesqiao Jul 30, 2017
fab7737
Merge branch 'develop' of https://github.com/PaddlePaddle/Paddle into…
jacquesqiao Jul 30, 2017
e4445d6
Merge branch 'develop' of https://github.com/PaddlePaddle/Paddle into…
jacquesqiao Jul 31, 2017
eda5493
use InputVar instead of Input<Variable>
jacquesqiao Jul 31, 2017
5f0ed40
typo
jacquesqiao Jul 31, 2017
bd8872c
optimize code
jacquesqiao Aug 1, 2017
4 changes: 2 additions & 2 deletions paddle/framework/net.h
@@ -57,9 +57,9 @@ class PlainNet : public Net {
* Infer all the operators' input and output variables' shapes, will be called
* before every mini-batch
*/
void InferShape(const std::shared_ptr<Scope>& scope) const override {
void InferShapeImpl(const InferShapeContext& ctx) const override {
Collaborator: In my mind, Impl is usually a suffix for a class name that implements an interface. Do we really need to name a function Impl here?

Collaborator: That's right; maybe just calling it InferShape is fine.

for (auto& op : ops_) {
op->InferShape(scope);
op->InferShape(ctx.scope_);
}
}

4 changes: 2 additions & 2 deletions paddle/framework/net_op_test.cc
@@ -16,8 +16,8 @@ static int run_cnt = 0;

class TestOp : public OperatorBase {
public:
void InferShape(
const std::shared_ptr<framework::Scope>& scope) const override {
void InferShapeImpl(
const paddle::framework::InferShapeContext& ctx) const override {
++infer_shape_cnt;
}
void Run(const std::shared_ptr<framework::Scope>& scope,
4 changes: 2 additions & 2 deletions paddle/framework/op_registry_test.cc
@@ -9,7 +9,7 @@ class CosineOp : public OperatorBase {
public:
void Run(const std::shared_ptr<Scope>& scope,
const platform::DeviceContext& dev_ctx) const override {}
void InferShape(const std::shared_ptr<Scope>& scope) const override {}
void InferShapeImpl(const InferShapeContext& ctx) const override {}
};

class CosineOpProtoAndCheckerMaker : public OpProtoAndCheckerMaker {
@@ -27,7 +27,7 @@ class CosineOpProtoAndCheckerMaker : public OpProtoAndCheckerMaker {

class MyTestOp : public OperatorBase {
public:
void InferShape(const std::shared_ptr<Scope>& scope) const override {}
void InferShapeImpl(const InferShapeContext& ctx) const override {}
void Run(const std::shared_ptr<Scope>& scope,
const platform::DeviceContext& dev_ctx) const override {}
};
4 changes: 4 additions & 0 deletions paddle/framework/operator.cc
@@ -79,6 +79,10 @@ std::vector<std::string> OperatorBase::Outputs(const std::string& name) const {
outputs_.begin() + output_format.at(offset + 1)};
}

void OperatorBase::InferShape(const std::shared_ptr<Scope>& scope) const {
InferShapeImpl(InferShapeContext(this, scope));
Collaborator: Does scope here have to be of type shared_ptr? It seems simpler if we could use const Scope&.

Collaborator: It cannot be done, because inside InferShape/Run some operators, e.g. RNN, create a new local Scope, which takes a std::shared_ptr<Scope> as an argument.

Member: Passing a reference to the shared pointer here is indeed confusing; could you add a comment? A reference to the pointer implies the pointer itself may be modified. If it is, what happens to the object it previously pointed to? Could that leak memory?

}

std::string OperatorBase::DebugString() const {
std::stringstream ss;
ss << "Op(" << type_ << "), inputs:(";
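The review thread on operator.cc above argues that the scope parameter cannot simply become const Scope&, because operators such as RNN build a child scope that shares ownership of its parent. The following is a minimal sketch of that pattern; Variable, Scope, and CreateVariable here are simplified stand-ins invented for illustration, not the framework's actual classes.

```cpp
#include <memory>
#include <string>
#include <unordered_map>

// Toy stand-ins for the framework types (assumptions for illustration only).
struct Variable {};

class Scope {
 public:
  Scope() = default;
  // A child scope keeps its parent alive by sharing ownership, which is why
  // it wants a std::shared_ptr<Scope> rather than a const Scope&.
  explicit Scope(std::shared_ptr<Scope> parent) : parent_(std::move(parent)) {}

  Variable* CreateVariable(const std::string& name) { return &vars_[name]; }

 private:
  std::shared_ptr<Scope> parent_;
  std::unordered_map<std::string, Variable> vars_;
};

// An RNN-like operator that builds a per-step child scope inside Run/InferShape.
void RunRecurrentStep(const std::shared_ptr<Scope>& scope) {
  // The child scope co-owns its parent, so a bare const Scope& would not be
  // enough to construct it.
  auto step_scope = std::make_shared<Scope>(scope);
  step_scope->CreateVariable("step_state");
}

int main() {
  auto global_scope = std::make_shared<Scope>();
  RunRecurrentStep(global_scope);
}
```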
154 changes: 84 additions & 70 deletions paddle/framework/operator.h
@@ -31,22 +31,9 @@ limitations under the License. */
namespace paddle {
namespace framework {

template <typename T>
struct EigenDeviceConverter;

template <>
struct EigenDeviceConverter<platform::CPUPlace> {
using EigenDeviceType = Eigen::DefaultDevice;
};

#ifndef PADDLE_ONLY_CPU
template <>
struct EigenDeviceConverter<platform::GPUPlace> {
using EigenDeviceType = Eigen::GpuDevice;
};
#endif

class OperatorBase;
class InferShapeContext;
class KernelContext;
/**
* OperatorBase has the basic element that Net will call to do computation.
* Only CreateOperator from OpRegistry will new Operator directly. User
@@ -84,7 +71,8 @@ class OperatorBase {

/// InferShape infer the size of Variables used by this Operator with
/// information inside scope
virtual void InferShape(const std::shared_ptr<Scope>& scope) const = 0;
virtual void InferShape(const std::shared_ptr<Scope>& scope) const final;
Collaborator: Here we use a reference to std::shared_ptr<Scope> as the parameter, and all InferShape calls share the same std::shared_ptr<Scope>. Does that mean there will be only one std::shared_ptr<Scope>? If so, why not use std::unique_ptr<Scope> instead?

virtual void InferShapeImpl(const InferShapeContext& ctx) const = 0;

/// Net will call this function to Run an op.
virtual void Run(const std::shared_ptr<Scope>& scope,
@@ -110,29 +98,32 @@ class OperatorBase {
std::shared_ptr<std::unordered_map<std::string, int>> in_out_idxs_;
};

class KernelContext {
class OperatorContext {
Collaborator: OperatorContext => ExecutionContext? Will we really have two concepts named OperatorContext and KernelContext? If not, wouldn't simply Context or ExecutionContext be clearer?

Member (author): ExecutionContext is better.

Collaborator: We actually have two contexts, one for InferShape and the other for Run.

Collaborator: See lines 35 and 36.

public:
KernelContext(const OperatorBase* op, const std::shared_ptr<Scope>& scope,
const platform::DeviceContext& device_context)
: op_(*op), scope_(scope), device_context_(device_context) {}
OperatorContext(const OperatorBase* op, const std::shared_ptr<Scope>& scope)
: op_(*op), scope_(scope) {}
Member: We have to check that OperatorBase* op is not null first. Also, we use const OperatorBase& op_ as a member; why not const std::shared_ptr<OperatorBase> op_?

Member (author): We do not need to check, because the context is only constructed inside an op, so op will never be null. For the same reason, there is no need for std::shared_ptr.


int InputSize() const { return static_cast<int>(op_.inputs_.size()); }
Collaborator: Why not size_t?


const Variable* Input(int index) const {
int OutputSize() const { return static_cast<int>(op_.outputs_.size()); }

const Variable* InputVar(int index) const {
Contributor: In OperatorBase, Input returns a string; in Context, Input returns a Tensor; and here is yet another InputVar.

Can we unify all the Input()s behind a single API like template <typename T> Input(std::string), implemented for three types: string, Tensor, and Variable?

That would be much simpler to understand. @jacquesqiao

Member (author): Great suggestion, thanks!

return scope_->GetVariable(op_.inputs_[index]);
}

Variable* Output(int index) const {
Variable* OutputVar(int index) const {
return scope_->GetVariable(op_.outputs_[index]);
}

const Variable* Input(const std::string& name) const {
const Variable* InputVar(const std::string& name) const {
Collaborator: Could std::vector<const Variable*> as a whole be the return type of Variable::Get()? For example:

typedef std::vector<Tensor*> TensorArray;
TensorArray tensors = var.Get<TensorArray>();

Contributor: Do we still need InputVar when we have template <typename T> Input(name)? Isn't InputVar just Input<Variable>?

return scope_->GetVariable(op_.Input(name));
}

const Variable* Output(const std::string& name) const {
Variable* OutputVar(const std::string& name) const {
return scope_->GetVariable(op_.Output(name));
}

const std::vector<const Variable*> Inputs(const std::string& name) const {
const std::vector<const Variable*> InputVars(const std::string& name) const {
auto names = op_.Inputs(name);
std::vector<const Variable*> res;
std::transform(
@@ -141,7 +132,7 @@ class KernelContext {
return res;
}

const std::vector<const Variable*> Outputs(const std::string& name) const {
const std::vector<const Variable*> OutputVars(const std::string& name) const {
auto names = op_.Outputs(name);
std::vector<const Variable*> res;
std::transform(
@@ -150,15 +141,80 @@ class KernelContext {
return res;
}

const Tensor& Input(int index) const {
return InputVar(index)->Get<Tensor>();
}

Tensor* Output(int index) const {
return OutputVar(index)->GetMutable<Tensor>();
}

const Tensor& Input(const std::string& name) const {
return InputVar(name)->Get<Tensor>();
}

Tensor* Output(const std::string& name) const {
return OutputVar(name)->GetMutable<Tensor>();
}

const std::vector<const Tensor*> Inputs(const std::string& name) const {
auto names = op_.Inputs(name);
std::vector<const Tensor*> res;
std::transform(names.begin(), names.end(), res.begin(),
[this](const std::string& name) {
return &scope_->GetVariable(name)->Get<Tensor>();
});
return res;
}

std::vector<const Tensor*> Outputs(const std::string& name) const {
auto names = op_.Outputs(name);
std::vector<const Tensor*> res;
std::transform(names.begin(), names.end(), res.begin(),
[this](const std::string& name) {
return scope_->GetVariable(name)->GetMutable<Tensor>();
});
return res;
}

const OperatorBase& op_;
const std::shared_ptr<Scope>& scope_;
};

class InferShapeContext : public OperatorContext {
public:
InferShapeContext(const OperatorBase* op, const std::shared_ptr<Scope>& scope)
: OperatorContext(op, scope) {}
};

template <typename T>
struct EigenDeviceConverter;

template <>
struct EigenDeviceConverter<platform::CPUPlace> {
using EigenDeviceType = Eigen::DefaultDevice;
};

#ifndef PADDLE_ONLY_CPU
template <>
struct EigenDeviceConverter<platform::GPUPlace> {
using EigenDeviceType = Eigen::GpuDevice;
};
#endif

class KernelContext : public OperatorContext {
public:
KernelContext(const OperatorBase* op, const std::shared_ptr<Scope>& scope,
const platform::DeviceContext& device_context)
: OperatorContext(op, scope), device_context_(device_context) {}

template <typename PlaceType,
typename DeviceType =
typename EigenDeviceConverter<PlaceType>::EigenDeviceType>
DeviceType* GetEigenDevice() const;

platform::Place GetPlace() const { return device_context_.GetPlace(); }

const OperatorBase& op_;
const std::shared_ptr<Scope>& scope_;
const platform::DeviceContext& device_context_;
};

@@ -176,19 +232,6 @@ class OpKernel {
virtual ~OpKernel() {}
};

template <typename T>
struct VarToTensor {};

template <>
struct VarToTensor<Tensor*> {
Tensor* operator()(Variable* var) { return var->GetMutable<Tensor>(); }
};

template <>
struct VarToTensor<const Tensor*> {
const Tensor* operator()(Variable* var) { return &var->Get<Tensor>(); }
};

class OperatorWithKernel : public OperatorBase {
public:
struct OpKernelKey {
@@ -223,35 +266,6 @@ class OperatorWithKernel : public OperatorBase {
static std::unordered_map<std::string, OpKernelMap> g_all_op_kernels;
return g_all_op_kernels;
}

void InferShape(const std::shared_ptr<Scope>& scope) const final {
std::vector<const Tensor*> ins;
VarNamesToTensors(scope, inputs_, &ins);
std::vector<Tensor*> outs;
VarNamesToTensors(scope, outputs_, &outs);
InferShape(ins, outs);
};

private:
template <typename T>
void VarNamesToTensors(const std::shared_ptr<Scope>& scope,
const std::vector<std::string>& var_names,
std::vector<T>* container) const {
container->reserve(var_names.size());
VarToTensor<T> convert;
for (auto& name : var_names) {
auto var = scope->GetVariable(name);
if (var != nullptr) {
container->push_back(convert(var));
} else {
container->push_back(nullptr);
}
}
}

protected:
virtual void InferShape(const std::vector<const Tensor*>& inputs,
const std::vector<Tensor*>& outputs) const = 0;
};

} // namespace framework
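The review thread on operator.h above suggests folding Input()/InputVar() into a single templated accessor, and the commit list includes "add template to OperatorContext Input/Output", which appears to adopt that idea. Below is a minimal sketch of how such an accessor could look; the Scope, Variable, Tensor, and Context classes are simplified stand-ins invented for illustration, not the framework's real types.

```cpp
#include <cassert>
#include <string>
#include <unordered_map>

// Toy stand-ins (assumptions for illustration only).
struct Tensor { int rows = 0; };

class Variable {
 public:
  template <typename T>
  const T& Get() const { return value_; }

 private:
  Tensor value_;
};

class Scope {
 public:
  // The toy scope creates a variable on first lookup.
  Variable* GetVariable(const std::string& name) { return &vars_[name]; }

 private:
  std::unordered_map<std::string, Variable> vars_;
};

// One templated accessor instead of separate Input()/InputVar() overloads:
// Input<Tensor>(name) unwraps the variable to its tensor, while
// Input<Variable>(name) returns the variable itself.
class Context {
 public:
  explicit Context(Scope* scope) : scope_(scope) {}

  template <typename T>
  const T* Input(const std::string& name) const {
    return &scope_->GetVariable(name)->Get<T>();
  }

 private:
  Scope* scope_;
};

// Specialization: asking for the Variable returns the variable, not a tensor.
template <>
const Variable* Context::Input<Variable>(const std::string& name) const {
  return scope_->GetVariable(name);
}

int main() {
  Scope scope;
  Context ctx(&scope);
  const Tensor* x = ctx.Input<Tensor>("X");       // unwrapped tensor
  const Variable* xv = ctx.Input<Variable>("X");  // raw variable
  assert(x != nullptr && xv != nullptr);
}
```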
8 changes: 4 additions & 4 deletions paddle/framework/operator_test.cc
@@ -24,7 +24,7 @@ static int op_run_num = 0;
class OpWithoutKernelTest : public OperatorBase {
public:
void Init() override { x = 1; }
void InferShape(const std::shared_ptr<Scope>& scope) const override {}
void InferShapeImpl(const framework::InferShapeContext& ctx) const override {}
void Run(const std::shared_ptr<Scope>& scope,
const platform::DeviceContext& dev_ctx) const override {
op_run_num++;
@@ -73,6 +73,7 @@ TEST(OperatorBase, all) {
auto op = paddle::framework::OpRegistry::CreateOp(op_desc);
scope->CreateVariable("OUT1");
ASSERT_EQ(paddle::framework::op_run_num, 0);
op->InferShape(scope);
op->Run(scope, device_context);
ASSERT_EQ(paddle::framework::op_run_num, 1);
}
@@ -97,8 +98,7 @@ static int cpu_kernel_run_num = 0;

class OpWithKernelTest : public OperatorWithKernel {
protected:
void InferShape(const std::vector<const Tensor*>& inputs,
const std::vector<Tensor*>& outputs) const override {}
void InferShapeImpl(const framework::InferShapeContext& ctx) const override {}
};

template <typename T1, typename T2>
Expand All @@ -117,7 +117,7 @@ class CPUKernelTest : public OpKernel {
class OperatorMultiInputsTest : public OperatorBase {
public:
void Init() override { x = 1; }
void InferShape(const std::shared_ptr<Scope>& scope) const override {}
void InferShapeImpl(const framework::InferShapeContext& ctx) const override {}
void Run(const std::shared_ptr<Scope>& scope,
const platform::DeviceContext& dev_ctx) const override {
ASSERT_EQ(scope->GetVariable(inputs_[0]), nullptr);
23 changes: 10 additions & 13 deletions paddle/operators/add_op.cc
@@ -21,17 +21,16 @@ namespace operators {

class AddOp : public framework::OperatorWithKernel {
protected:
void InferShape(
const std::vector<const framework::Tensor *> &inputs,
const std::vector<framework::Tensor *> &outputs) const override {
PADDLE_ENFORCE(inputs.size() == 2, "Input size of AddOp must be two");
PADDLE_ENFORCE(outputs.size() == 1, "Output size of AddOp must be one");
PADDLE_ENFORCE(
inputs[0] != nullptr && inputs[1] != nullptr && outputs[0] != nullptr,
"Inputs/Outputs of AddOp must all be set");
PADDLE_ENFORCE(inputs[0]->dims() == inputs[1]->dims(),
void InferShapeImpl(const framework::InferShapeContext &ctx) const override {
PADDLE_ENFORCE(ctx.InputSize() == 2, "Input size of AddOp must be two");
PADDLE_ENFORCE(ctx.OutputSize() == 1, "Output size of AddOp must be one");
PADDLE_ENFORCE(ctx.InputVar(0) != nullptr && ctx.InputVar(1) != nullptr,
"Inputs of AddOp must all be set");
PADDLE_ENFORCE(ctx.OutputVar(0) != nullptr,
"Outputs of AddOp must all be set");
PADDLE_ENFORCE(ctx.Input(0).dims() == ctx.Input(1).dims(),
"Two input of Add Op's dimension must be same.");
outputs[0]->Resize(inputs[0]->dims());
ctx.Output(0)->Resize(ctx.Input(0).dims());
}
};

@@ -52,9 +51,7 @@ The equation is: Out = X + Y

class AddOpGrad : public framework::OperatorWithKernel {
protected:
void InferShape(
const std::vector<const framework::Tensor *> &inputs,
const std::vector<framework::Tensor *> &outputs) const override {}
void InferShapeImpl(const framework::InferShapeContext &ctx) const override {}
std::string DebugString() const override {
LOG(INFO) << "AddOpGrad";
return "";
6 changes: 3 additions & 3 deletions paddle/operators/add_op.h
@@ -24,9 +24,9 @@ template <typename Place, typename T>
class AddKernel : public framework::OpKernel {
public:
void Compute(const framework::KernelContext& context) const override {
auto input0 = context.Input(0)->Get<framework::Tensor>();
auto input1 = context.Input(1)->Get<framework::Tensor>();
auto* output = context.Output(0)->GetMutable<framework::Tensor>();
auto input0 = context.Input(0);
auto input1 = context.Input(1);
auto* output = context.Output(0);

output->mutable_data<T>(context.GetPlace());

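The operator.h diff above has KernelContext resolve its Eigen device type at compile time through the EigenDeviceConverter trait, and kernels like the AddKernel just shown are templated on a Place. The following standalone sketch shows that trait pattern with toy place and device types standing in for platform::CPUPlace/GPUPlace and the Eigen devices; everything here is an illustrative assumption, not the framework's real code.

```cpp
#include <iostream>

// Toy place and device types (assumptions for illustration only).
struct CPUPlace {};
struct GPUPlace {};
struct DefaultDevice { const char* name() const { return "cpu"; } };
struct GpuDevice     { const char* name() const { return "gpu"; } };

// The trait: a compile-time mapping from a place type to its device type.
template <typename PlaceType>
struct EigenDeviceConverter;

template <>
struct EigenDeviceConverter<CPUPlace> {
  using EigenDeviceType = DefaultDevice;
};

template <>
struct EigenDeviceConverter<GPUPlace> {
  using EigenDeviceType = GpuDevice;
};

// A kernel templated on the place resolves its device type without any
// runtime branching, mirroring KernelContext::GetEigenDevice's default
// template argument.
template <typename PlaceType,
          typename DeviceType =
              typename EigenDeviceConverter<PlaceType>::EigenDeviceType>
void Compute() {
  DeviceType device;
  std::cout << "running on " << device.name() << "\n";
}

int main() {
  Compute<CPUPlace>();  // prints "running on cpu"
  Compute<GPUPlace>();  // prints "running on gpu"
}
```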
18 changes: 8 additions & 10 deletions paddle/operators/cross_entropy_op.cc
@@ -21,21 +21,19 @@ namespace operators {

class OnehotCrossEntropyOp : public framework::OperatorWithKernel {
protected:
void InferShape(
const std::vector<const framework::Tensor *> &inputs,
const std::vector<framework::Tensor *> &outputs) const override {
PADDLE_ENFORCE(inputs.size() == 2,
void InferShapeImpl(const framework::InferShapeContext &ctx) const override {
PADDLE_ENFORCE(ctx.InputSize() == 2,
"Input size of OnehotCrossEntropyOp must be two");
PADDLE_ENFORCE(outputs.size() == 1,
PADDLE_ENFORCE(ctx.OutputSize() == 1,
"Output size of OnehotCrossEntropyOp must be one");
PADDLE_ENFORCE(inputs[0] != nullptr && inputs[1] != nullptr,
PADDLE_ENFORCE(ctx.InputVar(0) != nullptr && ctx.InputVar(1) != nullptr,
"Inputs of OnehotCrossEntropyOp must all be set");
PADDLE_ENFORCE(outputs[0] != nullptr,
PADDLE_ENFORCE(ctx.OutputVar(0) != nullptr,
"Outputs of OnehotCrossEntropyOp must all be set");
PADDLE_ENFORCE(inputs[0]->dims().size() == 2, "X's dimension must be 2.");
PADDLE_ENFORCE(outputs[0]->dims().size() == 1,
PADDLE_ENFORCE(ctx.Input(0).dims().size() == 2, "X's dimension must be 2.");
PADDLE_ENFORCE(ctx.Output(0)->dims().size() == 1,
"label's dimension must be 1.");
outputs[0]->Resize(framework::make_ddim({inputs[0]->dims()[0]}));
ctx.Output(0)->Resize(framework::make_ddim({ctx.Input(0).dims()[0]}));
}
};
