@@ -13,8 +13,11 @@ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 See the License for the specific language governing permissions and
 limitations under the License. */
 
+#include "paddle/fluid/framework/infershape_utils.h"
 #include "paddle/fluid/framework/op_registry.h"
 #include "paddle/fluid/framework/op_version_registry.h"
+#include "paddle/phi/core/infermeta_utils.h"
+#include "paddle/phi/infermeta/fusion.h"
 #include "paddle/phi/kernels/funcs/fused_gemm_epilogue.h"
 
 namespace paddle {
@@ -25,107 +28,6 @@ class FusedGemmEpilogueOp : public framework::OperatorWithKernel {
   using framework::OperatorWithKernel::OperatorWithKernel;
 
  protected:
-  void InferShape(framework::InferShapeContext* ctx) const override {
-    OP_INOUT_CHECK(ctx->HasInput("X"), "Input", "X", "FusedGemmEpilogueOp");
-    OP_INOUT_CHECK(ctx->HasInput("Y"), "Input", "Y", "FusedGemmEpilogueOp");
-    OP_INOUT_CHECK(
-        ctx->HasInput("Bias"), "Output", "Bias", "FusedGemmEpilogueOp");
-    OP_INOUT_CHECK(
-        ctx->HasOutput("Out"), "Output", "Out", "FusedGemmEpilogueOp");
-
-    auto x_dims = ctx->GetInputDim("X");
-    auto y_dims = ctx->GetInputDim("Y");
-    auto bias_dims = ctx->GetInputDim("Bias");
-    auto trans_x = ctx->Attrs().Get<bool>("trans_x");
-    auto trans_y = ctx->Attrs().Get<bool>("trans_y");
-
-    PADDLE_ENFORCE_EQ(
-        y_dims.size(),
-        2,
-        platform::errors::InvalidArgument(
-            "The Input tensor Y's dimension of FusedGemmEpilogueOp "
-            "should be 2, but got %d.",
-            y_dims.size()));
-
-    PADDLE_ENFORCE_GE(
-        x_dims.size(),
-        2,
-        platform::errors::InvalidArgument(
-            "The Input tensor X's dimension of FusedGemmEpilogueOp "
-            "should be >= 2, but got %d.",
-            x_dims.size()));
-
-    PADDLE_ENFORCE_EQ(
-        bias_dims.size(),
-        1,
-        platform::errors::InvalidArgument(
-            "The Input tensor bias's dimension of FusedGemmEpilogueOp "
-            "should be == 1, but got %d.",
-            bias_dims.size()));
-
-    PADDLE_ENFORCE_EQ(bias_dims[0],
-                      trans_y ? y_dims[0] : y_dims[1],
-                      platform::errors::InvalidArgument(
-                          "The Input tensor bias's dimension 0"
-                          " should be == Y[-1], but got bias's shape = [%s] "
-                          "and Y's shape = [%s]",
-                          bias_dims,
-                          y_dims));
-
-    auto x_mat_dims =
-        common::flatten_to_2d(x_dims, trans_x ? 1 : x_dims.size() - 1);
-
-    int K_from_x = trans_x ? x_mat_dims[0] : x_mat_dims[1];
-    int K_from_y = trans_y ? y_dims[1] : y_dims[0];
-
-    PADDLE_ENFORCE_EQ(
-        K_from_x,
-        K_from_y,
-        platform::errors::InvalidArgument(
-            "The last dimension of X should be equal with Y's first dimension."
-            "But received X[-1] = [%d], Y[0] = [%d].",
-            K_from_x,
-            K_from_y));
-
-    std::vector<int64_t> out_dims;
-    out_dims.reserve(static_cast<size_t>(x_dims.size()));
-    if (trans_x) {
-      for (int i = 1; i < x_dims.size(); ++i) out_dims.push_back(x_dims[i]);
-    } else {
-      for (int i = 0; i < x_dims.size() - 1; ++i) out_dims.push_back(x_dims[i]);
-    }
-
-    if (trans_y) {
-      out_dims.push_back(y_dims[0]);
-    } else {
-      out_dims.push_back(y_dims[1]);
-    }
-    ctx->SetOutputDim("Out", common::make_ddim(out_dims));
-
-    auto activation = ctx->Attrs().Get<std::string>("activation");
-    if (ctx->HasOutput("ReserveSpace")) {
-      ctx->SetOutputDim("ReserveSpace", common::make_ddim(out_dims));
-
-      if (activation == "none") {
-        PADDLE_THROW(platform::errors::InvalidArgument(
-            "The ReserveSpace would not be used when activation = \"none\""));
-      } else {
-        int min_size_of_n = activation == "relu" ? 128 : 8;
-        int N_size = trans_y ? y_dims[0] : y_dims[1];
-        PADDLE_ENFORCE_EQ(
-            N_size % min_size_of_n,
-            0,
-            platform::errors::InvalidArgument(
-                "The output dimension N (X(MxK) * Y(KxN) = C(MxN)) "
-                "should be multiple of %d when auxiliary_key given "
-                "and activation=%s, but got N = %d.",
-                min_size_of_n,
-                activation,
-                N_size));
-      }
-    }
-  }
-
   phi::KernelKey GetExpectedKernelType(
       const framework::ExecutionContext& ctx) const override {
     auto data_type = OperatorWithKernel::IndicateVarDataType(ctx, "X");
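The InferShape deleted above is replaced by phi::FusedGemmEpilogueInferMeta, wired in through DECLARE_INFER_SHAPE_FUNCTOR at the bottom of this diff. As a minimal sketch only (not the actual contents of paddle/phi/infermeta/fusion.h; the parameter order and the set of checks there may differ), the phi-side function plausibly reproduces the same shape rule on MetaTensors:

// Sketch, assuming phi conventions (MetaTensor accessors, common::make_ddim).
void FusedGemmEpilogueInferMeta(const MetaTensor& x,
                                const MetaTensor& y,
                                const MetaTensor& bias,
                                bool trans_x,
                                bool trans_y,
                                const std::string& activation,
                                MetaTensor* out,
                                MetaTensor* reserve_space) {
  const auto& x_dims = x.dims();
  const auto& y_dims = y.dims();
  // Same rule the deleted InferShape encoded: keep the non-contracted
  // dims of X, then append N taken from Y (respecting trans_y).
  std::vector<int64_t> out_dims;
  if (trans_x) {
    for (int i = 1; i < x_dims.size(); ++i) out_dims.push_back(x_dims[i]);
  } else {
    for (int i = 0; i < x_dims.size() - 1; ++i) out_dims.push_back(x_dims[i]);
  }
  out_dims.push_back(trans_y ? y_dims[0] : y_dims[1]);
  out->set_dims(common::make_ddim(out_dims));
  out->set_dtype(x.dtype());
  // ReserveSpace mirrors Out's shape and is only meaningful when an
  // activation epilogue ("relu"/"gelu") is fused in.
  if (reserve_space && activation != "none") {
    reserve_space->set_dims(common::make_ddim(out_dims));
    reserve_space->set_dtype(x.dtype());
  }
}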
@@ -188,94 +90,6 @@ class FusedGemmEpilogueGradOp : public framework::OperatorWithKernel {
   using framework::OperatorWithKernel::OperatorWithKernel;
 
  protected:
-  void InferShape(framework::InferShapeContext* ctx) const override {
-    OP_INOUT_CHECK(
-        ctx->HasInput("DOut"), "Input", "DOut", "FusedGemmEpilogueGradOp");
-    OP_INOUT_CHECK(ctx->HasInput("X"), "Input", "X", "FusedGemmEpilogueGradOp");
-    OP_INOUT_CHECK(ctx->HasInput("Y"), "Input", "Y", "FusedGemmEpilogueGradOp");
-    OP_INOUT_CHECK(ctx->HasOutput("DY"), "Output", "DY", "FusedGemmEpilogueOp");
-
-    auto dout_dims = ctx->GetInputDim("DOut");
-    auto x_dims = ctx->GetInputDim("X");
-    auto y_dims = ctx->GetInputDim("Y");
-    auto trans_x = ctx->Attrs().Get<bool>("trans_x");
-    auto trans_y = ctx->Attrs().Get<bool>("trans_y");
-
-    PADDLE_ENFORCE_GE(
-        dout_dims.size(),
-        2,
-        platform::errors::InvalidArgument(
-            "The Input tensor DOut's dimension of FusedGemmEpilogueGradOp "
-            "should be >= 2, but got %d.",
-            dout_dims.size()));
-
-    PADDLE_ENFORCE_EQ(
-        y_dims.size(),
-        2,
-        platform::errors::InvalidArgument(
-            "The Input tensor Y's dimension of FusedGemmEpilogueGradOp "
-            "should be 2, but got %d.",
-            y_dims.size()));
-
-    PADDLE_ENFORCE_GE(
-        x_dims.size(),
-        2,
-        platform::errors::InvalidArgument(
-            "The Input tensor X's dimension of FusedGemmEpilogueGradOp "
-            "should be >= 2, but got %d.",
-            x_dims.size()));
-
-    PADDLE_ENFORCE_EQ(
-        dout_dims.size(),
-        x_dims.size(),
-        platform::errors::InvalidArgument(
-            "The Input tensor DOut's and X's dimension of "
-            "FusedGemmEpilogueGradOp "
-            "should be the same, but got DOut's dim = %d and X's = %d.",
-            dout_dims.size(),
-            x_dims.size()));
-
-    auto dout_mat_dims = common::flatten_to_2d(dout_dims, dout_dims.size() - 1);
-    auto x_mat_dims = common::flatten_to_2d(x_dims, x_dims.size() - 1);
-
-    PADDLE_ENFORCE_EQ(
-        dout_mat_dims[1],
-        trans_y ? y_dims[0] : y_dims[1],
-        platform::errors::InvalidArgument(
-            "The last dimension of DOut should be equal with Y's last"
-            " dimension. But received DOut[-1] = [%d], Y[1] = [%d].",
-            dout_mat_dims[1],
-            y_dims[1]));
-
-    PADDLE_ENFORCE_EQ(
-        dout_mat_dims[0],
-        trans_x ? x_mat_dims[1] : x_mat_dims[0],
-        platform::errors::InvalidArgument(
-            "The first dimension of DOut should be equal with X's first"
-            " dimension. But received DOut[0] = [%d], Y[0] = [%d].",
-            dout_mat_dims[0],
-            x_mat_dims[0]));
-
-    auto activation_grad = ctx->Attrs().Get<std::string>("activation_grad");
-    if (activation_grad != "none" && !ctx->HasInput("ReserveSpace")) {
-      PADDLE_ENFORCE_EQ(true,
-                        false,
-                        platform::errors::InvalidArgument(
-                            "The ReserveSpace should not be empty. "
-                            "when activation == {relu_grad, gelu_grad}."));
-    }
-
-    if (ctx->HasOutput("DX")) {
-      ctx->SetOutputDim("DX", x_dims);
-    }
-    ctx->SetOutputDim("DY", y_dims);
-
-    if (ctx->HasOutput("DBias")) {
-      int64_t dbias_dim = trans_y ? y_dims[0] : y_dims[1];
-      ctx->SetOutputDim("DBias", common::make_ddim({dbias_dim}));
-    }
-  }
-
   phi::KernelKey GetExpectedKernelType(
       const framework::ExecutionContext& ctx) const override {
     auto data_type = OperatorWithKernel::IndicateVarDataType(ctx, "DOut");
@@ -367,12 +181,19 @@ class FusedGemmEpilogueOpGradMaker : public framework::SingleGradOpMaker<T> {
 }  // namespace paddle
 
 namespace ops = paddle::operators;
-REGISTER_OPERATOR(
-    fused_gemm_epilogue,
-    ops::FusedGemmEpilogueOp,
-    ops::FusedGemmEpilogueOpMaker,
-    ops::FusedGemmEpilogueOpGradMaker<paddle::framework::OpDesc>,
-    ops::FusedGemmEpilogueOpGradMaker<paddle::imperative::OpBase>);
+DECLARE_INFER_SHAPE_FUNCTOR(fused_gemm_epilogue,
+                            FusedGemmEpilogueInferShapeFunctor,
+                            PD_INFER_META(phi::FusedGemmEpilogueInferMeta));
+DECLARE_INFER_SHAPE_FUNCTOR(fused_gemm_epilogue_grad,
+                            FusedGemmEpilogueGradInferShapeFunctor,
+                            PD_INFER_META(phi::FusedGemmEpilogueGradInferMeta));
+REGISTER_OPERATOR(fused_gemm_epilogue,
+                  ops::FusedGemmEpilogueOp,
+                  ops::FusedGemmEpilogueOpMaker,
+                  ops::FusedGemmEpilogueOpGradMaker<paddle::framework::OpDesc>,
+                  ops::FusedGemmEpilogueOpGradMaker<paddle::imperative::OpBase>,
+                  FusedGemmEpilogueInferShapeFunctor);
 REGISTER_OPERATOR(fused_gemm_epilogue_grad,
                   ops::FusedGemmEpilogueGradOp,
-                  ops::FusedGemmEpilogueGradOpMaker);
+                  ops::FusedGemmEpilogueGradOpMaker,
+                  FusedGemmEpilogueGradInferShapeFunctor);
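The grad op gets the same treatment via phi::FusedGemmEpilogueGradInferMeta. Again as a hedged sketch only (the parameter list in paddle/phi/infermeta/fusion.h is an assumption here, including whether ReserveSpace appears as an input), it would carry over the output-shape rules the deleted grad InferShape applied:

// Sketch, assuming phi conventions; signature may differ from the real header.
void FusedGemmEpilogueGradInferMeta(const MetaTensor& x,
                                    const MetaTensor& y,
                                    const MetaTensor& reserve_space,
                                    const MetaTensor& out_grad,
                                    bool trans_x,
                                    bool trans_y,
                                    const std::string& activation_grad,
                                    MetaTensor* x_grad,
                                    MetaTensor* y_grad,
                                    MetaTensor* bias_grad) {
  // Gradients take the shapes of their forward counterparts, exactly as
  // the deleted grad InferShape set them (DX <- X, DY <- Y).
  if (x_grad) {
    x_grad->set_dims(x.dims());
    x_grad->set_dtype(x.dtype());
  }
  y_grad->set_dims(y.dims());
  y_grad->set_dtype(y.dtype());
  if (bias_grad) {
    // DBias has length N: y_dims[0] if trans_y, else y_dims[1].
    const auto& y_dims = y.dims();
    int64_t dbias_dim = trans_y ? y_dims[0] : y_dims[1];
    bias_grad->set_dims(common::make_ddim({dbias_dim}));
    bias_grad->set_dtype(y.dtype());
  }
}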