
Commit ea01780

Authored by Hyeongseok Oh
[onert] Clean up Execution API (#15927)
This commit cleans up the Execution API:
- Add an API to access I/O info
- Remove APIs whose work can be handled by the new API
- Remove the setInput/setOutput overloads used only for NNAPI
- Change the IExecutors context parameter to inout (drop const) so it can return the shape inference result
- Change the IODescription vector element type: use the raw type instead of unique_ptr to allow simple copying

ONE-DCO-1.0-Signed-off-by: Hyeongseok Oh <[email protected]>
1 parent f0b931a commit ea01780
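The first two bullets of the message amount to the caller-side migration below. A minimal sketch, not code from this commit: the include path is an assumption and describeIO is a hypothetical helper, but the accessors and OperandInfo members match the diffs that follow.

#include "exec/Execution.h" // include path is an assumption

// Hypothetical helper: reads I/O metadata through the consolidated accessors.
void describeIO(onert::exec::Execution &execution)
{
  // Before: getInputInfo(i), getInputShape(i), getInputTotalSize(i), ...
  // After: one OperandInfo per I/O carries shape, byte size, and type.
  const onert::ir::OperandInfo &in = execution.inputInfo(0);
  const onert::ir::OperandInfo &out = execution.outputInfo(0);

  auto in_shape = in.shape();            // replaces getInputShape()
  auto in_bytes = in.total_size();       // replaces getInputTotalSize()
  auto out_type = out.typeInfo().type(); // same path output_tensorinfo() now uses
  (void)in_shape; (void)in_bytes; (void)out_type;
}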

13 files changed: +81 −204 lines

runtime/onert/api/nnfw/src/nnfw_session.cc

Lines changed: 11 additions & 59 deletions
@@ -815,7 +815,7 @@ NNFW_STATUS nnfw_session::input_tensorinfo(uint32_t index, nnfw_tensorinfo *ti)
   }
   else
   {
-    const auto &info = _execution->getInputInfo(index);
+    const auto &info = _execution->inputInfo(index);
     fillTensorInfo(ti, info.shape(), info.typeInfo().type());
   }
 }
@@ -855,10 +855,8 @@ NNFW_STATUS nnfw_session::output_tensorinfo(uint32_t index, nnfw_tensorinfo *ti)
   }
   else
   {
-    auto io_index = onert::ir::IOIndex{index};
-    auto shape = _execution->getOutputShape(io_index);
-    auto dtype = _compiler_artifact->_executors->outputInfo(io_index).typeInfo().type();
-    fillTensorInfo(ti, shape, dtype);
+    auto info = _execution->outputInfo(index);
+    fillTensorInfo(ti, info.shape(), info.typeInfo().type());
   }
 }
 catch (const std::exception &e)
@@ -1562,7 +1560,7 @@ NNFW_STATUS nnfw_session::train_set_input(uint32_t index, const void *input,
   try
   {
     auto ind = onert::ir::IOIndex(index);
-    auto size = _execution->getInputTotalSize(ind);
+    auto size = _execution->inputInfo(index).total_size();
     if (input_tensorinfo && getBufSize(input_tensorinfo) != size)
     {
       std::cerr
@@ -1607,8 +1605,7 @@ NNFW_STATUS nnfw_session::train_set_expected(uint32_t index, const void *expecte

   try
   {
-    auto output_ind = onert::ir::IOIndex(index);
-    auto size = _execution->getOutputTotalSize(output_ind);
+    auto size = _execution->outputInfo(index).total_size();
     if (expected_tensorinfo && getBufSize(expected_tensorinfo) != size)
     {
       std::cerr << "Error during nnfw_session::train_set_expected : invalid tensorinfo"
@@ -2285,28 +2282,16 @@ NNFW_STATUS nnfw_session::run_with_auto_compilation(const char *target, NNFW_COD
   std::vector<void *> _output_buffers;

   using namespace onert::ir;
-  // Save Inputs buffers, set compile option to use float type
-  for (auto input_index = IOIndex{0}; input_index < IOIndex{input_size}; input_index++)
-  {
-    auto input_Shape = _execution->getInputShape(input_index);
-    auto input_buffer = _execution->getInputBuffer(input_index);
+  // Copy execution context for backup: I/O buffer, shape, and execution options
+  const onert::exec::ExecutionContext ctx_backup = _execution->context();

-    _input_buffers.push_back(input_buffer);
+  // Set compile option to use float type
+  for (auto input_index = IOIndex{0}; input_index < IOIndex{input_size}; input_index++)
     _coptions->input_type.insert_or_assign(input_index, TypeInfo(DataType::FLOAT32));
-  }

   // Save Outputs buffers
   for (auto output_index = IOIndex{0}; output_index < IOIndex{output_size}; output_index++)
-  {
-    auto output_Shape = _execution->getOutputShape(output_index);
-    auto output_buffer = _execution->getOutputBuffer(output_index);
-
-    _output_buffers.push_back(output_buffer);
     _coptions->output_type.insert_or_assign(output_index, TypeInfo(DataType::FLOAT32));
-  }
-
-  // Save execution options
-  auto saved_options = _execution->executionOptions();

   // if there is compiled model - try to load it
   if (file_compiled_model.good())
@@ -2350,41 +2335,8 @@
     if (status != NNFW_STATUS_NO_ERROR)
       return status;

-    // Restore execution options
-    _execution->executionOptions() = saved_options;
-
-    // Restore inputs to the quantized or compiled model
-    for (uint32_t input_index = 0; input_index < _input_buffers.size(); input_index++)
-    {
-      nnfw_tensorinfo ti;
-      status = input_tensorinfo(input_index, &ti);
-      if (status != NNFW_STATUS_NO_ERROR)
-        return status;
-
-      auto input_size_in_bytes = getBufSize(&ti);
-
-      status = set_input(input_index, ti.dtype, _input_buffers[input_index], input_size_in_bytes);
-
-      if (status != NNFW_STATUS_NO_ERROR)
-        return status;
-    }
-
-    // Restore outputs to the quantized or compiled model
-    for (uint32_t output_index = 0; output_index < _output_buffers.size(); output_index++)
-    {
-
-      nnfw_tensorinfo ti;
-      status = output_tensorinfo(output_index, &ti);
-      if (status != NNFW_STATUS_NO_ERROR)
-        return status;
-
-      uint64_t output_size_in_bytes = getBufSize(&ti);
-
-      status =
-        set_output(output_index, ti.dtype, _output_buffers[output_index], output_size_in_bytes);
-      if (status != NNFW_STATUS_NO_ERROR)
-        return status;
-    }
+    // Restore execution context: I/O buffer, shape, and execution options
+    _execution->restoreContext(ctx_backup);
   }

   // Run quantized model
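The auto-compilation path above collapses the manual save/restore loops into a single context copy. A minimal sketch of the same pattern in isolation, assuming only the context()/restoreContext() pair added by this commit (the function name and include path are illustrative):

#include "exec/Execution.h" // include path is an assumption

// Illustrative: run with temporarily overridden I/O settings, then roll back.
void runWithTemporaryIO(onert::exec::Execution &execution)
{
  // A plain value copy now suffices because IODescription holds
  // InputDesc/OutputDesc by value (no unique_ptr elements).
  const onert::exec::ExecutionContext backup = execution.context();

  // ... change buffers, input shapes, or execution options and run ...

  // One call puts every I/O descriptor and option back.
  execution.restoreContext(backup);
}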

runtime/onert/core/include/exec/Execution.h

Lines changed: 16 additions & 33 deletions
@@ -69,38 +69,28 @@ class Execution
    */
   void setInput(const ir::IOIndex &index, const void *buffer, size_t length);

-  /**
-   * @brief Set input data's information, especially to specify unknown dimensions on model
-   * build time.
-   * @param[in] index Input index
-   * @param[in] shape Input data's shape
-   * @param[in] buffer Input data's buffer pointer
-   * @param[in] length Input data's length
-   */
-  void setInput(const ir::IOIndex &index, const ir::Shape &shape, const void *buffer,
-                size_t length);
   /**
    * @brief Set output data's information
    * @param[in] index Output index
    * @param[in] buffer Output data's buffer pointer
    * @param[in] length Output data's length
    */
   void setOutput(const ir::IOIndex &index, void *buffer, size_t length);
-  /**
-   * @brief Set output data's information, especially to specify unknown dimensions on model
-   * build time.
-   * @param[in] index Output index
-   * @param[in] shape Output data's shape
-   * @param[in] buffer Output data's buffer pointer
-   * @param[in] length Output data's length
-   */
-  void setOutput(const ir::IOIndex &index, const ir::Shape &shape, void *buffer, size_t length);
+
   /**
    * @brief Get the Input Info object
    * @param[in] index Input index
    * @return Input info
    */
-  const ir::OperandInfo &getInputInfo(uint32_t index) { return _ctx.desc.inputs.at(index)->info; }
+  const ir::OperandInfo &inputInfo(uint32_t index) { return _ctx.desc.inputs.at(index).info; }
+
+  /**
+   * @brief Get the Output Info object
+   * @param[in] index Output index
+   * @return Output info
+   */
+  const ir::OperandInfo &outputInfo(uint32_t index) { return _ctx.desc.outputs.at(index).info; }
+
   /**
    * @brief Execution
    * @note It should be called after setting input and output buffer
@@ -151,24 +141,17 @@ class Execution
   const std::function<void(const ir::OperandIndex &, const backend::train::ITrainableTensor *)>
     &fn) const;

-  ir::Shape getInputShape(ir::IOIndex ind) const;
-  ir::Shape getOutputShape(ir::IOIndex ind) const;
-  size_t getInputTotalSize(ir::IOIndex ind) const;
-  size_t getOutputTotalSize(ir::IOIndex ind) const;
-
   /**
-   * @brief Get pointer of Input Buffer
-   * @param[in] index Input index
-   * @return Pointer of Input Buffer
+   * @brief Get context of execution
+   * @return Execution context
    */
-  const void *getInputBuffer(ir::IOIndex ind) const;
+  const ExecutionContext &context() const { return _ctx; }

   /**
-   * @brief Get pointer of Output Buffer
-   * @param[in] index Output index
-   * @return Pointer of Output Buffer
+   * @brief Set context of execution at once
+   * @param[in] ctx Execution context
    */
-  void *getOutputBuffer(ir::IOIndex ind);
+  void restoreContext(const ExecutionContext &ctx) { _ctx = ctx; }

   ExecutionOptions &executionOptions() { return _ctx.options; }
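With the shape-taking setInput/setOutput overloads removed, a caller that previously passed a shape alongside a buffer now makes two calls. A minimal sketch (the include path, function name, buffer, and shape are placeholders; the API calls match the header above):

#include "exec/Execution.h" // include path is an assumption

void feedResizedInput(onert::exec::Execution &execution, const float *data)
{
  const onert::ir::IOIndex index{0};
  const onert::ir::Shape new_shape{1, 4}; // placeholder shape

  // Before: execution.setInput(index, new_shape, data, 16);
  // After: resize first, then bind the buffer.
  execution.changeInputShape(index, new_shape);
  execution.setInput(index, data, 16); // 16 bytes = 4 floats
}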

runtime/onert/core/include/exec/ExecutionContext.h

Lines changed: 2 additions & 2 deletions
@@ -49,8 +49,8 @@ struct OutputDesc

 struct IODescription
 {
-  std::vector<std::unique_ptr<InputDesc>> inputs;
-  std::vector<std::unique_ptr<OutputDesc>> outputs;
+  std::vector<InputDesc> inputs;
+  std::vector<OutputDesc> outputs;
 };

 struct ExecutionOptions
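The practical effect of dropping unique_ptr is that IODescription (and with it ExecutionContext) becomes copyable, which is exactly what context()/restoreContext() rely on. A minimal sketch, assuming the struct layout shown above (include path and function name are illustrative):

#include "exec/ExecutionContext.h" // include path is an assumption

void copyDescription(const onert::exec::IODescription &src)
{
  // With std::vector<std::unique_ptr<InputDesc>> elements this line would
  // not compile (unique_ptr is move-only); with by-value elements it is a
  // straightforward deep copy of every descriptor.
  onert::exec::IODescription backup = src;
  (void)backup;
}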

runtime/onert/core/include/exec/IExecutors.h

Lines changed: 3 additions & 3 deletions
@@ -98,10 +98,10 @@ class IExecutors
   virtual const backend::IPortableTensor *outputTensor(const ir::IOIndex &index) const = 0;

   /**
-   * @brief Execute NN package executor set
-   * @param[in] ctx Execution context
+   * @brief Execute NN package executor set
+   * @param[inout] ctx Execution context. It reflects execution result (ex. output shape inference)
    */
-  virtual void execute(const ExecutionContext &ctx) = 0;
+  virtual void execute(ExecutionContext &ctx) = 0;
 };

 } // namespace onert::exec
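Dropping const on the context parameter is what lets executor implementations write results back. A minimal sketch of what an IExecutors subclass can now do inside execute(); the helper name and `inferred` are illustrative, while the field accesses mirror Execution.h above:

#include "exec/ExecutionContext.h" // include path is an assumption

// Illustrative: reflect a dynamically inferred output shape into the context
// so that Execution::outputInfo() reports it after execute() returns.
void reflectOutputShape(onert::exec::ExecutionContext &ctx,
                        const onert::ir::Shape &inferred)
{
  // Legal only because IExecutors::execute() now takes ExecutionContext &
  // instead of const ExecutionContext &.
  ctx.desc.outputs.at(0).info.shape(inferred);
}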

runtime/onert/core/src/exec/Execution.cc

Lines changed: 11 additions & 66 deletions
@@ -32,13 +32,11 @@ Execution::Execution(const std::shared_ptr<IExecutors> &executors) : _executors{
   assert(executors->entryExecutor() != nullptr);

   // Initialize I/O description
-  _ctx.desc.inputs.resize(_executors->inputSize());
   for (uint32_t i = 0; i < _executors->inputSize(); ++i)
-    _ctx.desc.inputs.at(i) = std::make_unique<InputDesc>(_executors->inputInfo(ir::IOIndex(i)));
+    _ctx.desc.inputs.emplace_back(_executors->inputInfo(ir::IOIndex(i)));

-  _ctx.desc.outputs.resize(_executors->outputSize());
   for (uint32_t i = 0; i < _executors->outputSize(); ++i)
-    _ctx.desc.outputs.at(i) = std::make_unique<OutputDesc>(_executors->outputInfo(ir::IOIndex(i)));
+    _ctx.desc.outputs.emplace_back(_executors->outputInfo(ir::IOIndex(i)));
   _ctx.shape_updated = false;

   _is_internal_output_tensor.resize(_executors->outputSize());
@@ -62,9 +60,9 @@ void Execution::changeInputShape(const ir::IOIndex &index, const ir::Shape &new_
   // Note that 'compiled' model will not be updated with new_shape
   // but new_shape will change model input shape while 'running' the model
   auto &input_desc = _ctx.desc.inputs.at(index.value());
-  if (new_shape != input_desc->info.shape())
+  if (new_shape != input_desc.info.shape())
   {
-    input_desc->info.shape(new_shape);
+    input_desc.info.shape(new_shape);
     _ctx.shape_updated = true;

     VERBOSE(Execution) << "Model input shape will be changed at the start of execute()"
@@ -77,15 +75,8 @@ void Execution::setInput(const ir::IOIndex &index, const void *buffer, size_t le
 {
   // Length validation in execute(): datatype can be changed by API call
   auto &input_desc = _ctx.desc.inputs.at(index.value());
-  input_desc->buffer = buffer;
-  input_desc->size = length;
-}
-
-void Execution::setInput(const ir::IOIndex &index, const ir::Shape &shape, const void *buffer,
-                         size_t length)
-{
-  changeInputShape(index, shape);
-  setInput(index, buffer, length);
+  input_desc.buffer = buffer;
+  input_desc.size = length;
 }

 void Execution::setOutput(const ir::IOIndex &index, void *buffer, size_t length)
@@ -94,17 +85,8 @@ void Execution::setOutput(const ir::IOIndex &index, void *buffer, size_t length)
   // - datatype can be changed by API call
   // - shape can be changed by dynamic shape inference
   auto &output_desc = _ctx.desc.outputs.at(index.value());
-  output_desc->buffer = buffer;
-  output_desc->size = length;
-}
-
-void Execution::setOutput(const ir::IOIndex &index, const ir::Shape &shape, void *buffer,
-                          size_t length)
-{
-  auto &output_desc = _ctx.desc.outputs.at(index.value());
-  output_desc->info.shape(shape);
-
-  setOutput(index, buffer, length);
+  output_desc.buffer = buffer;
+  output_desc.size = length;
 }

 void Execution::execute()
@@ -114,7 +96,7 @@ void Execution::execute()
   // Input length validation check
   for (const auto &input : _ctx.desc.inputs)
   {
-    if (input->info.total_size() > input->size)
+    if (input.info.total_size() > input.size)
       throw std::runtime_error{"Too small input buffer length"};
   }

@@ -126,9 +108,9 @@
   {
     const bool is_managed_internally = _is_internal_output_tensor.at(i);
     const auto &output = _ctx.desc.outputs.at(i);
-    if (!is_managed_internally && output->info.total_size() > output->size)
+    if (!is_managed_internally && output.info.total_size() > output.size)
       throw std::runtime_error{"Too small output buffer length"};
-    if (is_managed_internally && output->buffer != nullptr)
+    if (is_managed_internally && output.buffer != nullptr)
       VERBOSE(Execution) << "Warning: Output buffer was set from API even though the output "
                             "tensor was allocated internally"
                          << std::endl;
@@ -193,41 +175,4 @@ void Execution::iterateTrainableTensors(
   execs->iterateTrainableTensors(fn);
 }

-ir::Shape Execution::getInputShape(ir::IOIndex ind) const
-{
-  return _ctx.desc.inputs.at(ind.value())->info.shape();
-}
-
-// NNAPI return fail if ANeuralNetworksExecution_getOutputOperandRank or
-// ANeuralNetworksExecution_getOutputOperandDimensions is called before execution.
-// On the other hand, NNFW API return static shape inference result if nnfw_output_tensorinfo is
-// called before execution.
-// To handle both case, this method retun static shape inference result and fail will be handled on
-// NNAPI frontend.
-ir::Shape Execution::getOutputShape(ir::IOIndex ind) const
-{
-  return _ctx.desc.outputs.at(ind.value())->info.shape();
-}
-
-size_t Execution::getInputTotalSize(ir::IOIndex ind) const
-{
-  // TODO Support dynamic shape
-  return _ctx.desc.inputs.at(ind.value())->info.total_size();
-}
-
-size_t Execution::getOutputTotalSize(ir::IOIndex ind) const
-{
-  return _ctx.desc.outputs.at(ind.value())->info.total_size();
-}
-
-const void *Execution::getInputBuffer(ir::IOIndex ind) const
-{
-  return _ctx.desc.inputs.at(ind.value())->buffer;
-}
-
-void *Execution::getOutputBuffer(ir::IOIndex ind)
-{
-  return _ctx.desc.outputs.at(ind.value())->buffer;
-}
-
 } // namespace onert::exec
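The constructor change above follows from the container change: with by-value elements the vector can build each descriptor in place instead of resizing and assigning freshly allocated objects. A standalone sketch of the same idiom; SimpleDesc/SimpleInfo are stand-ins for InputDesc/OperandInfo, not types from this commit:

#include <vector>

struct SimpleInfo { int size = 0; };                    // stands in for ir::OperandInfo
struct SimpleDesc
{
  SimpleInfo info;
  explicit SimpleDesc(const SimpleInfo &i) : info(i) {} // like InputDesc(const OperandInfo &)
};

int main()
{
  std::vector<SimpleDesc> descs;
  // Before: descs.resize(n); then descs.at(i) = std::make_unique<...>(info);
  // After: construct each element in place, no per-element heap allocation.
  descs.emplace_back(SimpleInfo{4});
  return descs.front().info.size == 4 ? 0 : 1;
}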

runtime/onert/core/src/exec/Execution.test.cc

Lines changed: 8 additions & 9 deletions
@@ -366,12 +366,14 @@ TEST(ExecInstance, neg_small_inoutsize)

   onert::exec::Execution execution{executors};

-  execution.setInput(input1, new_shape, reinterpret_cast<const void *>(input1_buffer), 8);
-  execution.setInput(input2, new_shape, reinterpret_cast<const void *>(input2_buffer), 2);
+  execution.changeInputShape(input1, new_shape);
+  execution.changeInputShape(input2, new_shape);
+  execution.setInput(input1, reinterpret_cast<const void *>(input1_buffer), 8);
+  execution.setInput(input2, reinterpret_cast<const void *>(input2_buffer), 2);
   EXPECT_THROW(execution.execute(), std::exception);

   // Not throw exception because input shape is changed and output buffer is enough
-  execution.setInput(input2, new_shape, reinterpret_cast<const void *>(input2_buffer), 8);
+  execution.setInput(input2, reinterpret_cast<const void *>(input2_buffer), 8);
   execution.setOutput(output, reinterpret_cast<void *>(output_buffer), 16);
   execution.execute();

@@ -762,12 +764,9 @@ TEST(ExecInstance, multi_model_dequant_input_quant_output)
   auto executors = mockup.artifact->_executors;

   onert::exec::Execution execution{executors};
-  execution.setInput(input1, execution.getInputShape(input1),
-                     reinterpret_cast<const void *>(input1_buffer), 4);
-  execution.setInput(input2, execution.getInputShape(input2),
-                     reinterpret_cast<const void *>(input2_buffer), 4);
-  execution.setOutput(output, execution.getOutputShape(output),
-                      reinterpret_cast<void *>(output_buffer), 4);
+  execution.setInput(input1, reinterpret_cast<const void *>(input1_buffer), 4);
+  execution.setInput(input2, reinterpret_cast<const void *>(input2_buffer), 4);
+  execution.setOutput(output, reinterpret_cast<void *>(output_buffer), 4);
   execution.execute();

   for (auto i = 0; i < 4; i++)