Paddle/paddle/framework/executor_test.cc

/* Copyright (c) 2016 PaddlePaddle Authors. All Rights Reserved.

Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at

    http://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License. */

#include "paddle/framework/executor.h"

#include <cstdint>
#include <cstring>
#include <memory>
#include <string>
#include <vector>

#include "gflags/gflags.h"
#include "gtest/gtest.h"
#include "paddle/framework/attribute.h"
#include "paddle/framework/backward.h"
#include "paddle/framework/block_desc.h"
#include "paddle/framework/op_desc.h"
#include "paddle/framework/op_registry.h"
#include "paddle/framework/operator.h"

USE_OP(elementwise_add);
USE_OP(gaussian_random);
USE_OP(feed);
USE_OP(fetch);
USE_OP(mul);
USE_OP(sum);
USE_OP(squared_l2_distance);
USE_OP(fill_constant);
USE_OP(mean);
USE_OP(sgd);

using namespace paddle::platform;
using namespace paddle::framework;

// Appends an operator of kind `type` to `block`.
//
// Every output variable name that `block` does not contain yet (according to
// HasVar) is first created in the block with its data type set to FP32;
// variables that already exist are left untouched. The operator is then
// appended, receives the given inputs, outputs and attributes, and finally
// has CheckAttrs() called on it.
//
//   type    - operator type name handed to SetType().
//   inputs  - slot name -> variable names, forwarded to SetInput().
//   outputs - slot name -> variable names, forwarded to SetOutput().
//   attrs   - attribute map forwarded to SetAttrMap().
//   block   - block description that receives the variables and the operator.
void AddOp(const std::string& type, const VariableNameMap& inputs,
           const VariableNameMap& outputs, AttributeMap attrs,
           paddle::framework::BlockDescBind* block) {
  // Declare the output variables the block does not know about yet.
  for (const auto& slot : outputs) {
    for (const auto& var_name : slot.second) {
      if (!block->HasVar(var_name)) {
        auto var = block->Var(var_name);
        var->SetDataType(paddle::framework::DataType::FP32);
      }
    }
  }

  // Append the operator and wire up its slots and attributes.
  auto op = block->AppendOp();
  op->SetType(type);
  for (const auto& slot : inputs) {
    op->SetInput(slot.first, slot.second);
  }
  for (const auto& slot : outputs) {
    op->SetOutput(slot.first, slot.second);
  }
  op->SetAttrMap(attrs);
  op->CheckAttrs();
}

// Copies host-side data into the "feed_value" variable of the global scope.
//
// The variable is looked up with FindVar() and is expected to exist already
// (NOTE(review): no null check is done here - confirm the global scope always
// provides it). It holds a std::vector of Tensors, which is resized to
// inputs.size(). Tensor i is allocated on CPUPlace with shape dims[i] and
// filled with inputs[i]. Tensors in the feed value variable only live in
// CPUPlace, so a plain memcpy from vector<T> is sufficient.
//
// Enforces that `dims` and `inputs` have the same length and that the element
// count described by dims[i] equals inputs[i].size(), so the memcpy can
// neither overrun nor only partially fill the destination buffer.
template <typename T>
void SetFeedVariable(const std::vector<std::vector<T>>& inputs,
                     const std::vector<std::vector<int64_t>>& dims) {
  // One shape per input; otherwise dims[i] below would read out of range.
  PADDLE_ENFORCE_EQ(dims.size(), inputs.size());

  Variable* g_feed_value = GetGlobalScope().FindVar("feed_value");
  auto& feed_inputs =
      *(g_feed_value->GetMutable<std::vector<paddle::framework::Tensor>>());
  const size_t size = inputs.size();
  feed_inputs.resize(size);
  for (size_t i = 0; i < size; ++i) {
    // The buffer is sized from dims[i] while the copy length comes from
    // inputs[i]; make sure both describe the same number of elements.
    size_t expected_numel = 1;
    for (int64_t extent : dims[i]) {
      expected_numel *= static_cast<size_t>(extent);
    }
    PADDLE_ENFORCE_EQ(inputs[i].size(), expected_numel);

    T* dst = feed_inputs[i].mutable_data<T>(make_ddim(dims[i]), CPUPlace());
    memcpy(dst, inputs[i].data(), inputs[i].size() * sizeof(T));
  }
}

// Tensors in fetch value variable will only be in CPUPlace
// So we can memcpy the data from fetch_value to vector<T>
template <typename T>
std::vector<std::vector<T>> GetFetchVariable() {
  Variable* g_fetch_value = GetGlobalScope().FindVar("fetch_value");
  auto& fetch_outputs =
      *(g_fetch_value->GetMutable<std::vector<paddle::framework::Tensor>>());

  size_t size = fetch_outputs.size();
  std::vector<std::vector<T>> result;
  result.reserve(size);
  for (size_t i = 0; i < size; i++) {
    std::vector<T> tmp;
    tmp.resize(fetch_outputs[i].numel());
    memcpy(tmp.data(), fetch_outputs[i].data<T>(),
           fetch_outputs[i].numel() * sizeof(T));
    result.push_back(tmp);
  }

  return result;
}

class ExecutorTesterRandom : public ::testing::Test {
 public:
  virtual void SetUp() override {
    int input_dim = 3, batch_size = 2, embed_dim = 5;

    auto temp_init_root_block = init_pdesc_.add_blocks();
    temp_init_root_block->set_idx(0);
    temp_init_root_block->set_parent_idx(-1);
    paddle::framework::ProgramDescBind& init_program =
        paddle::framework::ProgramDescBind::Instance(&init_pdesc_);
    paddle::framework::BlockDescBind* init_root_block = init_program.Block(0);

    AddOp("gaussian_random", {}, {{"Out", {"w1"}}},
          {{"dims", std::vector<int>{input_dim, embed_dim}}}, init_root_block);
    AddOp("gaussian_random", {}, {{"Out", {"w2"}}},
          {{"dims", std::vector<int>{embed_dim, input_dim}}}, init_root_block);
    AddOp("fetch", {{"Input", {"w1"}}}, {}, {{"col", 0}}, init_root_block);
    AddOp("fetch", {{"Input", {"w2"}}}, {}, {{"col", 1}}, init_root_block);

    // flush
    init_program.Proto();

    // run block
    auto temp_root_block = pdesc_.add_blocks();
    temp_root_block->set_idx(0);
    temp_root_block->set_parent_idx(-1);
    paddle::framework::ProgramDescBind& program =
        paddle::framework::ProgramDescBind::Instance(&pdesc_);
    paddle::framework::BlockDescBind* root_block = program.Block(0);

    // feed data
    inputs_.push_back({1.0, 1.0, 1.0, 1.0, 1.0, 1.0});
    dims_.push_back({batch_size, input_dim});
    AddOp("feed", {}, {{"Out", {"a"}}},
          {{"dims", std::vector<int>{batch_size, input_dim}}, {"col", 0}},
          root_block);

    // forward
    AddOp("mul", {{"X", {"a"}}, {"Y", {"w1"}}}, {{"Out", {"b"}}}, {},
          root_block);
    AddOp("mul", {{"X", {"b"}}, {"Y", {"w2"}}}, {{"Out", {"a_out"}}}, {},
          root_block);
    AddOp("squared_l2_distance", {{"X", {"a"}}, {"Y", {"a_out"}}},
          {{"Out", {"l2_distance"}}, {"sub_result", {"l2_distance_sub"}}}, {},
          root_block);
    AddOp("mean", {{"X", {"l2_distance"}}}, {{"Out", {"mean_out"}}}, {},
          root_block);

    // backward
    auto target = VarDescBind("mean_out");
    AppendBackward(program, target, {});

    // update
    AddOp("fill_constant", {}, {{"Out", {"learning_rate"}}},
          {{"shape", std::vector<int>{1}}, {"value", float(0.001)}},
          root_block);
    AddOp("sgd", {{"Param", {"w1"}},
                  {"LearningRate", {"learning_rate"}},
                  {"Grad", {"w1@GRAD"}}},
          {{"ParamOut", {"w1"}}}, {}, root_block);
    AddOp("sgd", {{"Param", {"w2"}},
                  {"LearningRate", {"learning_rate"}},
                  {"Grad", {"w2@GRAD"}}},
          {{"ParamOut", {"w2"}}}, {}, root_block);

    AddOp("fetch", {{"Input", {"w1"}}}, {}, {{"col", 0}}, root_block);
    AddOp("fetch", {{"Input", {"w2"}}}, {}, {{"col", 1}}, root_block);
    AddOp("fetch", {{"Input", {"l2_distance"}}}, {}, {{"col", 0}}, root_block);

    // flush
    program.Proto();
  }

 protected:
  ProgramDesc init_pdesc_;
  ProgramDesc pdesc_;
  std::vector<std::vector<float>> inputs_;
  std::vector<std::vector<int64_t>> dims_;
};

// Fixture whose program only feeds two variables ("a" from column 0, "b" from
// column 1) and fetches them back into the same columns. inputs_ holds the
// two six-element vectors to feed and dims_ their one-dimensional shapes.
class ExecutorTesterFeedAndFetch : public ::testing::Test {
 public:
  void SetUp() override {
    // Create block 0 without a parent in the raw program description.
    auto raw_root = pdesc_.add_blocks();
    raw_root->set_idx(0);
    raw_root->set_parent_idx(-1);

    // Wrap the description so ops can be appended through BlockDescBind.
    ProgramDescBind& bound_program = ProgramDescBind::Instance(&pdesc_);
    BlockDescBind* block = bound_program.Block(0);

    std::vector<int> feed_shape{6};

    AddOp("feed", {}, {{"Out", {"a"}}}, {{"dims", feed_shape}, {"col", 0}},
          block);
    AddOp("feed", {}, {{"Out", {"b"}}}, {{"dims", feed_shape}, {"col", 1}},
          block);
    AddOp("fetch", {{"Input", {"a"}}}, {}, {{"col", 0}}, block);
    AddOp("fetch", {{"Input", {"b"}}}, {}, {{"col", 1}}, block);

    // flush
    bound_program.Proto();

    // Data to feed, followed by one single-extent shape per vector.
    const std::vector<std::vector<float>> samples = {
        {1.0, 2.0, 3.0, 4.0, 5.0, 6.0}, {4.0, 5.0, 6.0, 7.0, 8.0, 9.0}};
    for (const auto& sample : samples) {
      inputs_.push_back(sample);
    }
    for (const auto& sample : samples) {
      dims_.push_back({static_cast<int64_t>(sample.size())});
    }
  }

 protected:
  ProgramDesc pdesc_;
  std::vector<std::vector<float>> inputs_;
  std::vector<std::vector<int64_t>> dims_;
};

#ifndef PADDLE_WITH_CUDA
// Runs the initialization program, feeds one batch, runs the main program
// once on the CPU and reads the fetch variable back.
TEST_F(ExecutorTesterRandom, CPU) {
  CPUPlace cpu;
  std::vector<Place> places;
  places.push_back(cpu);

  // A global Scope and a global BuddyAllocator both exist. The allocator has
  // to be initialized before the Scope so that the Scope is destroyed first;
  // otherwise a "pointer being freed was not allocated" error appears.
  paddle::memory::Used(cpu);

  Executor executor(places);

  executor.Run(init_pdesc_, &GetGlobalScope(), 0);
  SetFeedVariable<float>(inputs_, dims_);
  executor.Run(pdesc_, &GetGlobalScope(), 0);
  const std::vector<std::vector<float>> fetched = GetFetchVariable<float>();
}

// Feeds the fixture's inputs and runs the feed/fetch program on the CPU three
// times, checking after every run that the fetched tensors equal the data
// that was fed.
TEST_F(ExecutorTesterFeedAndFetch, CPU) {
  std::vector<Place> places;
  CPUPlace cpu_place;
  places.push_back(cpu_place);

  // A global Scope and a global BuddyAllocator both exist. The allocator has
  // to be initialized before the Scope so that the Scope is destroyed first;
  // otherwise a "pointer being freed was not allocated" error appears.
  paddle::memory::Used(cpu_place);

  Executor executor(places);

  for (int batch_id = 0; batch_id < 3; ++batch_id) {
    SetFeedVariable<float>(inputs_, dims_);
    executor.Run(pdesc_, &GetGlobalScope(), 0);
    const std::vector<std::vector<float>> result = GetFetchVariable<float>();

    // gtest assertions report the failing batch/tensor instead of surfacing
    // as an exception thrown out of the test body.
    ASSERT_EQ(inputs_.size(), result.size()) << "batch " << batch_id;
    for (size_t i = 0; i < result.size(); ++i) {
      ASSERT_EQ(inputs_[i].size(), result[i].size())
          << "batch " << batch_id << ", tensor " << i;
      // The data is only copied through feed and fetch, so the values are
      // compared for exact equality, as before.
      EXPECT_EQ(inputs_[i], result[i])
          << "batch " << batch_id << ", tensor " << i;
    }
  }
}
#else
// Runs the initialization program once and then feeds and runs the main
// program three times on GPU 0.
TEST_F(ExecutorTesterRandom, GPU) {
  GPUPlace gpu(0);
  std::vector<Place> places;
  places.push_back(gpu);

  // A global Scope and a global BuddyAllocator both exist. The allocator has
  // to be initialized before the Scope so that the Scope is destroyed first;
  // otherwise a "pointer being freed was not allocated" error appears.
  // When paddle is compiled with GPU support, both the CPU and the GPU
  // BuddyAllocator have to be touched up front.
  paddle::memory::Used(CPUPlace());
  paddle::memory::Used(gpu);

  Executor executor(places);

  executor.Run(init_pdesc_, &GetGlobalScope(), 0);
  for (int step = 0; step != 3; ++step) {
    SetFeedVariable<float>(inputs_, dims_);
    executor.Run(pdesc_, &GetGlobalScope(), 0);
  }
}

// Feeds the fixture's inputs and runs the feed/fetch program on GPU 0 three
// times, checking after every run that the fetched tensors equal the data
// that was fed.
TEST_F(ExecutorTesterFeedAndFetch, GPU) {
  std::vector<Place> places;
  GPUPlace gpu_place(0);
  places.push_back(gpu_place);

  // A global Scope and a global BuddyAllocator both exist. The allocator has
  // to be initialized before the Scope so that the Scope is destroyed first;
  // otherwise a "pointer being freed was not allocated" error appears.
  // When paddle is compiled with GPU support, both the CPU and the GPU
  // BuddyAllocator have to be touched up front.
  paddle::memory::Used(CPUPlace());
  paddle::memory::Used(gpu_place);

  Executor executor(places);

  for (int batch_id = 0; batch_id < 3; ++batch_id) {
    SetFeedVariable<float>(inputs_, dims_);
    executor.Run(pdesc_, &GetGlobalScope(), 0);
    const std::vector<std::vector<float>> result = GetFetchVariable<float>();

    // gtest assertions report the failing batch/tensor instead of surfacing
    // as an exception thrown out of the test body.
    ASSERT_EQ(inputs_.size(), result.size()) << "batch " << batch_id;
    for (size_t i = 0; i < result.size(); ++i) {
      ASSERT_EQ(inputs_[i].size(), result[i].size())
          << "batch " << batch_id << ", tensor " << i;
      // The data is only copied through feed and fetch, so the values are
      // compared for exact equality, as before.
      EXPECT_EQ(inputs_[i], result[i])
          << "batch " << batch_id << ", tensor " << i;
    }
  }
}

DECLARE_double(fraction_of_gpu_memory_to_use);

int main(int argc, char** argv) {
  testing::InitGoogleTest(&argc, argv);
  // Use less GPU memory for unittest.
  FLAGS_fraction_of_gpu_memory_to_use = 0.25;
  return RUN_ALL_TESTS();
}

#endif
add executor class and interface 7 years ago			`/* Copyright (c) 2016 PaddlePaddle Authors. All Rights Reserve.`

			`Licensed under the Apache License, Version 2.0 (the "License");`
			`you may not use this file except in compliance with the License.`
			`You may obtain a copy of the License at`

			`http://www.apache.org/licenses/LICENSE-2.0`

			`Unless required by applicable law or agreed to in writing, software`
			`distributed under the License is distributed on an "AS IS" BASIS,`
			`WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.`
			`See the License for the specific language governing permissions and`
			`limitations under the License. */`

			`#include "paddle/framework/executor.h"`
clean up for review 7 years ago
			`#include <memory>`
add executor feed operator test 7 years ago			`#include <vector>`
clean up for review 7 years ago
Stablize executor_test (#4774) Use less GPU memory 7 years ago			`#include "gflags/gflags.h"`
add elementwise_add 7 years ago			`#include "gtest/gtest.h"`
simple test 7 years ago			`#include "paddle/framework/attribute.h"`
before backward 7 years ago			`#include "paddle/framework/backward.h"`
Add AddOp 7 years ago			`#include "paddle/framework/block_desc.h"`
			`#include "paddle/framework/op_desc.h"`
add elementwise_add 7 years ago			`#include "paddle/framework/op_registry.h"`
			`#include "paddle/framework/operator.h"`

debug executor_test 7 years ago			`USE_OP(elementwise_add);`
			`USE_OP(gaussian_random);`
			`USE_OP(feed);`
			`USE_OP(fetch);`
			`USE_OP(mul);`
			`USE_OP(sum);`
			`USE_OP(squared_l2_distance);`
			`USE_OP(fill_constant);`
create grad_var when run Backward pass (#4796) * add target to Backward, generate var in block when call backward * modify backward_test * fix executor_test * set var desc default type to LOD_TENSOR * update backward_test * insert loss in the top level of backward * create grad vars for all blocks in current program * optimize code * update test_program.py * only create var for newly create blocks when backward 7 years ago			`USE_OP(mean);`
debug executor_test 7 years ago			`USE_OP(sgd);`

add executor unittest 7 years ago			`using namespace paddle::platform;`
			`using namespace paddle::framework;`

Add AddOp 7 years ago			`void AddOp(const std::string& type, const VariableNameMap& inputs,`
			`const VariableNameMap& outputs, AttributeMap attrs,`
clean up && fix #4624 7 years ago			`paddle::framework::BlockDescBind* block) {`
Add AddOp 7 years ago			`// insert output`
			`for (auto kv : outputs) {`
			`for (auto v : kv.second) {`
Merge remote-tracking branch 'origin/develop' into fix/scope 7 years ago			`// <<<<<<< HEAD`
			`// auto var = block->Var(v);`
			`// var->SetType(VarDesc::LOD_TENSOR);`
			`// var->SetDataType(paddle::framework::DataType::FP32);`
			`// =======`
create grad_var when run Backward pass (#4796) * add target to Backward, generate var in block when call backward * modify backward_test * fix executor_test * set var desc default type to LOD_TENSOR * update backward_test * insert loss in the top level of backward * create grad vars for all blocks in current program * optimize code * update test_program.py * only create var for newly create blocks when backward 7 years ago			`if (!block->HasVar(v)) {`
Merge remote-tracking branch 'origin/develop' into fix/scope 7 years ago			`auto var = block->Var(v);`
create grad_var when run Backward pass (#4796) * add target to Backward, generate var in block when call backward * modify backward_test * fix executor_test * set var desc default type to LOD_TENSOR * update backward_test * insert loss in the top level of backward * create grad vars for all blocks in current program * optimize code * update test_program.py * only create var for newly create blocks when backward 7 years ago			`var->SetDataType(paddle::framework::DataType::FP32);`
			`}`
Merge remote-tracking branch 'origin/develop' into fix/scope 7 years ago			`// >>>>>>> origin/develop`
Add AddOp 7 years ago			`}`
			`}`

			`// insert op`
clean up && fix #4624 7 years ago			`auto op = block->AppendOp();`
			`op->SetType(type);`
clean up for review 7 years ago			`for (auto& kv : inputs) {`
clean up && fix #4624 7 years ago			`op->SetInput(kv.first, kv.second);`
Add AddOp 7 years ago			`}`
clean up for review 7 years ago			`for (auto& kv : outputs) {`
clean up && fix #4624 7 years ago			`op->SetOutput(kv.first, kv.second);`
Add AddOp 7 years ago			`}`
clean up && fix #4624 7 years ago			`op->SetAttrMap(attrs);`
Remove attribute check from CreateGradOpDescs() (#4723) * Remove attr_checker from CreateGradOpDescs() * Fix merge error * Fix bug in backward_test.cc 7 years ago			`op->CheckAttrs();`
Add AddOp 7 years ago			`}`

FeedOp and FetchOp unit test 7 years ago			`// Tensors in feed value variable will only be in CPUPlace`
follow comments and refine codes 7 years ago			`// So we can memcpy the data from vector<T> to feed_value`
add executor feed operator test 7 years ago			`template <typename T>`
set variable support dim 7 years ago			`void SetFeedVariable(const std::vector<std::vector<T>>& inputs,`
			`const std::vector<std::vector<int64_t>>& dims) {`
follow comments 7 years ago			`Variable* g_feed_value = GetGlobalScope().FindVar("feed_value");`
follow comments and refine codes 7 years ago			`auto& feed_inputs =`
			`*(g_feed_value->GetMutable<std::vector<paddle::framework::Tensor>>());`
clean up for review 7 years ago			`size_t size = inputs.size();`
ensure global BuddyAllocator is initialized before global Scope 7 years ago			`feed_inputs.resize(size);`
add executor feed operator test 7 years ago			`for (size_t i = 0; i < size; i++) {`
set variable support dim 7 years ago			`T* dst = feed_inputs[i].mutable_data<T>(make_ddim(dims[i]), CPUPlace());`
ensure global BuddyAllocator is initialized before global Scope 7 years ago			`memcpy(dst, inputs[i].data(), inputs[i].size() * sizeof(T));`
add executor feed operator test 7 years ago			`}`
			`}`

FeedOp and FetchOp unit test 7 years ago			`// Tensors in fetch value variable will only be in CPUPlace`
			`// So we can memcpy the data from fetch_value to vector<T>`
add fetch operator 7 years ago			`template <typename T>`
clean up for review 7 years ago			`std::vector<std::vector<T>> GetFetchVariable() {`
follow comments 7 years ago			`Variable* g_fetch_value = GetGlobalScope().FindVar("fetch_value");`
follow comments and refine codes 7 years ago			`auto& fetch_outputs =`
			`*(g_fetch_value->GetMutable<std::vector<paddle::framework::Tensor>>());`
add fetch operator 7 years ago
clean up for review 7 years ago			`size_t size = fetch_outputs.size();`
add fetch operator 7 years ago			`std::vector<std::vector<T>> result;`
			`result.reserve(size);`
			`for (size_t i = 0; i < size; i++) {`
			`std::vector<T> tmp;`
ensure global BuddyAllocator is initialized before global Scope 7 years ago			`tmp.resize(fetch_outputs[i].numel());`
add fetch operator 7 years ago			`memcpy(tmp.data(), fetch_outputs[i].data<T>(),`
			`fetch_outputs[i].numel() * sizeof(T));`
			`result.push_back(tmp);`
			`}`
FeedOp and FetchOp unit test 7 years ago
add fetch operator 7 years ago			`return result;`
			`}`

add executor feed operator test 7 years ago			`class ExecutorTesterRandom : public ::testing::Test {`
refine codes 7 years ago			`public:`
			`virtual void SetUp() override {`
set variable support dim 7 years ago			`int input_dim = 3, batch_size = 2, embed_dim = 5;`
Add AddOp 7 years ago
debug for sum 7 years ago			`auto temp_init_root_block = init_pdesc_.add_blocks();`
			`temp_init_root_block->set_idx(0);`
			`temp_init_root_block->set_parent_idx(-1);`
			`paddle::framework::ProgramDescBind& init_program =`
			`paddle::framework::ProgramDescBind::Instance(&init_pdesc_);`
			`paddle::framework::BlockDescBind* init_root_block = init_program.Block(0);`
clean up && fix #4624 7 years ago
Add AddOp 7 years ago			`AddOp("gaussian_random", {}, {{"Out", {"w1"}}},`
debug for sum 7 years ago			`{{"dims", std::vector<int>{input_dim, embed_dim}}}, init_root_block);`
Add AddOp 7 years ago			`AddOp("gaussian_random", {}, {{"Out", {"w2"}}},`
debug for sum 7 years ago			`{{"dims", std::vector<int>{embed_dim, input_dim}}}, init_root_block);`
make infershape of feedop and fetchop compatible with compile-time design 7 years ago			`AddOp("fetch", {{"Input", {"w1"}}}, {}, {{"col", 0}}, init_root_block);`
			`AddOp("fetch", {{"Input", {"w2"}}}, {}, {{"col", 1}}, init_root_block);`
debug for sum 7 years ago
			`// flush`
			`init_program.Proto();`

pass simple backward 7 years ago			`// run block`
debug for sum 7 years ago			`auto temp_root_block = pdesc_.add_blocks();`
			`temp_root_block->set_idx(0);`
			`temp_root_block->set_parent_idx(-1);`
			`paddle::framework::ProgramDescBind& program =`
			`paddle::framework::ProgramDescBind::Instance(&pdesc_);`
			`paddle::framework::BlockDescBind* root_block = program.Block(0);`
refine codes 7 years ago
set variable support dim 7 years ago			`// feed data`
clean up 7 years ago			`inputs_.push_back({1.0, 1.0, 1.0, 1.0, 1.0, 1.0});`
set variable support dim 7 years ago			`dims_.push_back({batch_size, input_dim});`
			`AddOp("feed", {}, {{"Out", {"a"}}},`
			`{{"dims", std::vector<int>{batch_size, input_dim}}, {"col", 0}},`
			`root_block);`

pass simple backward 7 years ago			`// forward`
remove hardcode add_XX_op 7 years ago			`AddOp("mul", {{"X", {"a"}}, {"Y", {"w1"}}}, {{"Out", {"b"}}}, {},`
debug for sum 7 years ago			`root_block);`
remove hardcode add_XX_op 7 years ago			`AddOp("mul", {{"X", {"b"}}, {"Y", {"w2"}}}, {{"Out", {"a_out"}}}, {},`
debug for sum 7 years ago			`root_block);`
before backward 7 years ago			`AddOp("squared_l2_distance", {{"X", {"a"}}, {"Y", {"a_out"}}},`
			`{{"Out", {"l2_distance"}}, {"sub_result", {"l2_distance_sub"}}}, {},`
debug for sum 7 years ago			`root_block);`
create grad_var when run Backward pass (#4796) * add target to Backward, generate var in block when call backward * modify backward_test * fix executor_test * set var desc default type to LOD_TENSOR * update backward_test * insert loss in the top level of backward * create grad vars for all blocks in current program * optimize code * update test_program.py * only create var for newly create blocks when backward 7 years ago			`AddOp("mean", {{"X", {"l2_distance"}}}, {{"Out", {"mean_out"}}}, {},`
			`root_block);`
Init at block[0]; Run at block[1] 7 years ago
pass simple backward 7 years ago			`// backward`
create grad_var when run Backward pass (#4796) * add target to Backward, generate var in block when call backward * modify backward_test * fix executor_test * set var desc default type to LOD_TENSOR * update backward_test * insert loss in the top level of backward * create grad vars for all blocks in current program * optimize code * update test_program.py * only create var for newly create blocks when backward 7 years ago			`auto target = VarDescBind("mean_out");`
			`AppendBackward(program, target, {});`
pass simple backward 7 years ago
			`// update`
			`AddOp("fill_constant", {}, {{"Out", {"learning_rate"}}},`
clean up 7 years ago			`{{"shape", std::vector<int>{1}}, {"value", float(0.001)}},`
			`root_block);`
pass simple backward 7 years ago			`AddOp("sgd", {{"Param", {"w1"}},`
			`{"LearningRate", {"learning_rate"}},`
			`{"Grad", {"w1@GRAD"}}},`
			`{{"ParamOut", {"w1"}}}, {}, root_block);`
			`AddOp("sgd", {{"Param", {"w2"}},`
			`{"LearningRate", {"learning_rate"}},`
			`{"Grad", {"w2@GRAD"}}},`
			`{{"ParamOut", {"w2"}}}, {}, root_block);`

make infershape of feedop and fetchop compatible with compile-time design 7 years ago			`AddOp("fetch", {{"Input", {"w1"}}}, {}, {{"col", 0}}, root_block);`
			`AddOp("fetch", {{"Input", {"w2"}}}, {}, {{"col", 1}}, root_block);`
set variable support dim 7 years ago			`AddOp("fetch", {{"Input", {"l2_distance"}}}, {}, {{"col", 0}}, root_block);`
pass simple backward 7 years ago
clean up && fix #4624 7 years ago			`// flush`
			`program.Proto();`
refine codes 7 years ago			`}`
simple test 7 years ago
refine codes 7 years ago			`protected:`
debug for sum 7 years ago			`ProgramDesc init_pdesc_;`
refine codes 7 years ago			`ProgramDesc pdesc_;`
set variable support dim 7 years ago			`std::vector<std::vector<float>> inputs_;`
			`std::vector<std::vector<int64_t>> dims_;`
refine codes 7 years ago			`};`

FeedOp and FetchOp unit test 7 years ago			`class ExecutorTesterFeedAndFetch : public ::testing::Test {`
add executor feed operator test 7 years ago			`public:`
			`virtual void SetUp() override {`
clean up && fix #4624 7 years ago			`auto temp_root_block = pdesc_.add_blocks();`
			`temp_root_block->set_idx(0);`
			`temp_root_block->set_parent_idx(-1);`

			`// wrap to BlockDescBind`
			`paddle::framework::ProgramDescBind& program =`
			`paddle::framework::ProgramDescBind::Instance(&pdesc_);`
			`paddle::framework::BlockDescBind* root_block = program.Block(0);`
add executor feed operator test 7 years ago
ensure global BuddyAllocator is initialized before global Scope 7 years ago			`std::vector<int> dim{6};`

remove hardcode add_XX_op 7 years ago			`AddOp("feed", {}, {{"Out", {"a"}}}, {{"dims", dim}, {"col", 0}},`
			`root_block);`
			`AddOp("feed", {}, {{"Out", {"b"}}}, {{"dims", dim}, {"col", 1}},`
			`root_block);`
make infershape of feedop and fetchop compatible with compile-time design 7 years ago			`AddOp("fetch", {{"Input", {"a"}}}, {}, {{"col", 0}}, root_block);`
			`AddOp("fetch", {{"Input", {"b"}}}, {}, {{"col", 1}}, root_block);`
add fetch operator 7 years ago
clean up && fix #4624 7 years ago			`// flush`
			`program.Proto();`

ensure global BuddyAllocator is initialized before global Scope 7 years ago			`std::vector<float> vec1 = {1.0, 2.0, 3.0, 4.0, 5.0, 6.0};`
			`std::vector<float> vec2 = {4.0, 5.0, 6.0, 7.0, 8.0, 9.0};`
add executor feed operator test 7 years ago			`inputs_.push_back(vec1);`
			`inputs_.push_back(vec2);`
set variable support dim 7 years ago			`dims_.push_back({static_cast<int64_t>(vec1.size())});`
			`dims_.push_back({static_cast<int64_t>(vec2.size())});`
add executor feed operator test 7 years ago			`}`

			`protected:`
			`ProgramDesc pdesc_;`
			`std::vector<std::vector<float>> inputs_;`
set variable support dim 7 years ago			`std::vector<std::vector<int64_t>> dims_;`
add executor feed operator test 7 years ago			`};`

fix executor gpu unittest runtime error 7 years ago			`#ifndef PADDLE_WITH_CUDA`
add executor feed operator test 7 years ago			`TEST_F(ExecutorTesterRandom, CPU) {`
follow comments 7 years ago			`std::vector<Place> places;`
ensure global BuddyAllocator is initialized before global Scope 7 years ago			`CPUPlace cpu_place;`
			`places.push_back(cpu_place);`

			`// We have a global Scope and BuddyAllocator, and we must ensure`
			`// global BuddyAllocator is initialized before global Scope. Thus,`
			`// global Scope will deconstruct before BuddyAllocator. Otherwise,`
			`// "pointer being freed was not allocated" error will appear.`
			`paddle::memory::Used(cpu_place);`
follow comments 7 years ago
clean up for review 7 years ago			`std::unique_ptr<Executor> executor(new Executor(places));`

follow comments 7 years ago			`executor->Run(init_pdesc_, &GetGlobalScope(), 0);`
			`SetFeedVariable<float>(inputs_, dims_);`
			`executor->Run(pdesc_, &GetGlobalScope(), 0);`
clean up for review 7 years ago			`std::vector<std::vector<float>> result = GetFetchVariable<float>();`
add executor feed operator test 7 years ago			`}`

FeedOp and FetchOp unit test 7 years ago			`TEST_F(ExecutorTesterFeedAndFetch, CPU) {`
add executor feed operator test 7 years ago			`std::vector<Place> places;`
			`CPUPlace cpu_place;`
			`places.push_back(cpu_place);`

ensure global BuddyAllocator is initialized before global Scope 7 years ago			`// We have a global Scope and BuddyAllocator, and we must ensure`
			`// global BuddyAllocator is initialized before global Scope. Thus,`
			`// global Scope will deconstruct before BuddyAllocator. Otherwise,`
			`// "pointer being freed was not allocated" error will appear.`
			`paddle::memory::Used(cpu_place);`

clean up for review 7 years ago			`std::unique_ptr<Executor> executor(new Executor(places));`
add executor feed operator test 7 years ago
clean up for review 7 years ago			`for (int batch_id = 0; batch_id < 3; batch_id++) {`
set variable support dim 7 years ago			`SetFeedVariable<float>(inputs_, dims_);`
follow comments 7 years ago			`executor->Run(pdesc_, &GetGlobalScope(), 0);`
clean up for review 7 years ago			`std::vector<std::vector<float>> result = GetFetchVariable<float>();`
FeedOp and FetchOp unit test 7 years ago			`PADDLE_ENFORCE_EQ(result.size(), inputs_.size());`
			`for (size_t i = 0; i < result.size(); ++i) {`
			`PADDLE_ENFORCE_EQ(result[i].size(), inputs_[i].size());`
			`for (size_t j = 0; j < result[i].size(); ++j) {`
			`PADDLE_ENFORCE_EQ(result[i][j], inputs_[i][j]);`
add fetch operator 7 years ago			`}`
			`}`
add executor feed operator test 7 years ago			`}`
refine codes 7 years ago			`}`
fix executor gpu unittest runtime error 7 years ago			`#else`
add executor feed operator test 7 years ago			`TEST_F(ExecutorTesterRandom, GPU) {`
			`std::vector<Place> places;`
			`GPUPlace gpu_place(0);`
			`places.push_back(gpu_place);`

fix executor gpu unittest runtime error 7 years ago			`// We have a global Scope and BuddyAllocator, and we must ensure`
			`// global BuddyAllocator is initialized before global Scope. Thus,`
			`// global Scope will deconstruct before BuddyAllocator. Otherwise,`
			`// "pointer being freed was not allocated" error will appear.`
			`// If paddle is compiled with GPU, both CPU and GPU BuddyAllocator`
			`// need to be used at first.`
			`paddle::memory::Used(CPUPlace());`
ensure global BuddyAllocator is initialized before global Scope 7 years ago			`paddle::memory::Used(gpu_place);`

clean up for review 7 years ago			`std::unique_ptr<Executor> executor(new Executor(places));`
Add AddOp 7 years ago
follow comments 7 years ago			`executor->Run(init_pdesc_, &GetGlobalScope(), 0);`
pass multiple forward backward 7 years ago			`for (int batch_id = 0; batch_id < 3; batch_id++) {`
set variable support dim 7 years ago			`SetFeedVariable<float>(inputs_, dims_);`
follow comments 7 years ago			`executor->Run(pdesc_, &GetGlobalScope(), 0);`
pass multiple forward backward 7 years ago			`}`
add executor feed operator test 7 years ago			`}`

FeedOp and FetchOp unit test 7 years ago			`TEST_F(ExecutorTesterFeedAndFetch, GPU) {`
refine codes 7 years ago			`std::vector<Place> places;`
add executor feed operator test 7 years ago			`GPUPlace gpu_place(0);`
			`places.push_back(gpu_place);`
fix executor gpu unittest runtime error 7 years ago			`// We have a global Scope and BuddyAllocator, and we must ensure`
			`// global BuddyAllocator is initialized before global Scope. Thus,`
			`// global Scope will deconstruct before BuddyAllocator. Otherwise,`
			`// "pointer being freed was not allocated" error will appear.`
			`// If paddle is compiled with GPU, both CPU and GPU BuddyAllocator`
			`// need to be used at first.`
			`paddle::memory::Used(CPUPlace());`
ensure global BuddyAllocator is initialized before global Scope 7 years ago			`paddle::memory::Used(gpu_place);`

clean up for review 7 years ago			`std::unique_ptr<Executor> executor(new Executor(places));`
add executor feed operator test 7 years ago
clean up for review 7 years ago			`for (int batch_id = 0; batch_id < 3; batch_id++) {`
set variable support dim 7 years ago			`SetFeedVariable<float>(inputs_, dims_);`
follow comments 7 years ago			`executor->Run(pdesc_, &GetGlobalScope(), 0);`
clean up for review 7 years ago			`std::vector<std::vector<float>> result = GetFetchVariable<float>();`
FeedOp and FetchOp unit test 7 years ago			`PADDLE_ENFORCE_EQ(result.size(), inputs_.size());`
			`for (size_t i = 0; i < result.size(); ++i) {`
			`PADDLE_ENFORCE_EQ(result[i].size(), inputs_[i].size());`
			`for (size_t j = 0; j < result[i].size(); ++j) {`
			`PADDLE_ENFORCE_EQ(result[i][j], inputs_[i][j]);`
fix executor gpu unittest 7 years ago			`}`
			`}`
			`}`
simple test 7 years ago			`}`
Stablize executor_test (#4774) Use less GPU memory 7 years ago
			`DECLARE_double(fraction_of_gpu_memory_to_use);`

			`int main(int argc, char** argv) {`
			`testing::InitGoogleTest(&argc, argv);`
			`// Use less GPU memory for unittest.`
			`FLAGS_fraction_of_gpu_memory_to_use = 0.25;`
			`return RUN_ALL_TESTS();`
Fix CPU compile (#4781) 7 years ago			`}`

refine codes 7 years ago			`#endif`