/* Copyright (c) 2016 PaddlePaddle Authors. All Rights Reserved.

Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at

    http://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License. */

#include "paddle/framework/executor.h"
#include <vector>
#include "gtest/gtest.h"
#include "paddle/framework/attribute.h"
#include "paddle/framework/block_desc.h"
#include "paddle/framework/grad_op_builder.h"
#include "paddle/framework/op_desc.h"
#include "paddle/framework/op_registry.h"
#include "paddle/framework/operator.h"

USE_OP(elementwise_add);
USE_OP(gaussian_random);
USE_OP(feed);
USE_OP(fetch);
USE_OP(mul);

using std::string;
using namespace paddle::platform;
using namespace paddle::framework;

typedef paddle::framework::BlockDesc proto_block;
typedef paddle::framework::OpDesc proto_op;

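// Writes a single Attribute variant value into the corresponding field of
// the OpDesc::Attr protobuf message pointed to by attr_.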
struct SetAttrDescVisitor : public boost::static_visitor<void> {
  explicit SetAttrDescVisitor(OpDesc::Attr* attr) : attr_(attr) {}
  mutable OpDesc::Attr* attr_;
  void operator()(int v) const { attr_->set_i(v); }
  void operator()(float v) const { attr_->set_f(v); }
  void operator()(const std::string& v) const { attr_->set_s(v); }
  void operator()(bool b) const { attr_->set_b(b); }

  void operator()(const std::vector<int>& v) const {
    VectorToRepeated(v, attr_->mutable_ints());
  }
  void operator()(const std::vector<float>& v) const {
    VectorToRepeated(v, attr_->mutable_floats());
  }
  void operator()(const std::vector<std::string>& v) const {
    VectorToRepeated(v, attr_->mutable_strings());
  }
  void operator()(const std::vector<bool>& v) const {
    VectorToRepeated(v, attr_->mutable_bools());
  }
  void operator()(BlockDesc* desc) const { attr_->set_block_idx(desc->idx()); }
  void operator()(boost::blank) const { PADDLE_THROW("Unexpected branch"); }
};

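// Appends the output variable descriptions and one operator description,
// assembled from type/inputs/outputs/attrs, to the given block.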
void AddOp(const std::string& type, const VariableNameMap& inputs,
           const VariableNameMap& outputs, AttributeMap attrs,
           proto_block* block) {
  // insert output
  for (auto kv : outputs) {
    for (auto v : kv.second) {
      auto var = block->add_vars();
      var->set_name(v);
      auto var_lt = var->mutable_lod_tensor();
      var_lt->set_data_type(paddle::framework::DataType::FP32);
    }
  }

  // insert op
  auto op = block->add_ops();
  op->set_type(type);
  for (auto kv : inputs) {
    auto X = op->add_inputs();
    X->set_parameter(kv.first);
    for (auto argu : kv.second) {
      X->add_arguments(argu);
    }
  }
  for (auto kv : outputs) {
    auto X = op->add_outputs();
    X->set_parameter(kv.first);
    for (auto argu : kv.second) {
      X->add_arguments(argu);
    }
  }
  for (auto& attr : attrs) {
    auto* attr_desc = op->add_attrs();
    attr_desc->set_name(attr.first);
    attr_desc->set_type(
        static_cast<paddle::framework::AttrType>(attr.second.which() - 1));
    SetAttrDescVisitor visitor(attr_desc);
    boost::apply_visitor(visitor, attr.second);
  }
}

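// The add_*_op helpers below append a variable description plus a single
// operator description directly to the protobuf block.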
void add_gaussian_random_op(string var_name, std::vector<int> dim,
                            proto_block* block) {
  // insert variable
  auto a = block->add_vars();
  a->set_name(var_name);
  auto a_lt = a->mutable_lod_tensor();
  a_lt->set_data_type(paddle::framework::DataType::FP32);
  for (int i : dim) {
    a_lt->add_dims(i);
  }

  // insert operation
  auto op = block->add_ops();
  op->set_type("gaussian_random");
  auto dims = op->add_attrs();
  dims->set_name("dims");
  dims->set_type(paddle::framework::AttrType::INTS);
  for (int i : dim) {
    dims->add_ints(i);
  }
  auto Out = op->add_outputs();
  Out->set_parameter("Out");
  Out->add_arguments(var_name);
}

void add_feed_op(string var_name, const std::vector<int>& dim, int index,
                 proto_block* block) {
  // insert variable
  auto a = block->add_vars();
  a->set_name(var_name);
  auto a_lt = a->mutable_lod_tensor();
  a_lt->set_data_type(paddle::framework::DataType::FP32);
  for (int i : dim) {
    a_lt->add_dims(i);
  }

  // insert operation
  auto op = block->add_ops();
  op->set_type("feed");

  // set dims attr
  auto dims = op->add_attrs();
  dims->set_name("dims");
  dims->set_type(paddle::framework::AttrType::INTS);
  for (int i : dim) {
    dims->add_ints(i);
  }

  // set col attr
  auto col = op->add_attrs();
  col->set_name("col");
  col->set_type(paddle::framework::AttrType::INT);
  col->set_i(index);

  auto Out = op->add_outputs();
  Out->set_parameter("Out");
  Out->add_arguments(var_name);
}

void add_fetch_op(string var_name, std::vector<int> dim, int index,
                  proto_block* block) {
  // insert variable
  auto a = block->add_vars();
  a->set_name(var_name);
  auto a_lt = a->mutable_lod_tensor();
  a_lt->set_data_type(paddle::framework::DataType::FP32);
  for (int i : dim) {
    a_lt->add_dims(i);
  }

  // insert operation
  auto op = block->add_ops();
  op->set_type("fetch");

  // set dims attr
  auto dims = op->add_attrs();
  dims->set_name("dims");
  dims->set_type(paddle::framework::AttrType::INTS);
  for (int i : dim) {
    dims->add_ints(i);
  }

  // set col attr
  auto col = op->add_attrs();
  col->set_name("col");
  col->set_type(paddle::framework::AttrType::INT);
  col->set_i(index);

  auto Input = op->add_inputs();
  Input->set_parameter("Input");
  Input->add_arguments(var_name);
}

void add_mul_op(string X_str, string Y_str, string Out_str,
                proto_block* block) {
  // insert variable
  auto a = block->add_vars();
  a->set_name(Out_str);
  auto a_lt = a->mutable_lod_tensor();
  a_lt->set_data_type(paddle::framework::DataType::FP32);

  // insert op
  auto op = block->add_ops();
  op->set_type("mul");
  auto X = op->add_inputs();
  X->set_parameter("X");
  X->add_arguments(X_str);
  auto Y = op->add_inputs();
  Y->set_parameter("Y");
  Y->add_arguments(Y_str);
  auto Out = op->add_outputs();
  Out->set_parameter("Out");
  Out->add_arguments(Out_str);
}

std::once_flag set_variable_flag;

// Tensors in the feed_value variable live only in CPUPlace, so we can
// memcpy the data from vector<T> into feed_value.
template <typename T>
void set_feed_variable(const std::vector<std::vector<T>>& inputs) {
  typedef std::vector<paddle::framework::Tensor> FeedInputs;
  Variable* g_feed_value = GetGlobalScope()->FindVar("feed_value");
  FeedInputs& feed_inputs = *(g_feed_value->GetMutable<FeedInputs>());
  auto size = inputs.size();
  feed_inputs.resize(size);
  for (size_t i = 0; i < size; i++) {
    T* dst = feed_inputs[i].mutable_data<T>(
        make_ddim({static_cast<int64_t>(inputs[i].size())}), CPUPlace());
    memcpy(dst, inputs[i].data(), inputs[i].size() * sizeof(T));
  }
}

// Tensors in the fetch_value variable live only in CPUPlace, so we can
// memcpy the data from fetch_value into vector<T>.
template <typename T>
std::vector<std::vector<T>> get_fetch_variable() {
  typedef std::vector<paddle::framework::Tensor> FetchOutputs;
  Variable* g_fetch_value = GetGlobalScope()->FindVar("fetch_value");
  FetchOutputs& fetch_outputs = *(g_fetch_value->GetMutable<FetchOutputs>());

  auto size = fetch_outputs.size();
  std::vector<std::vector<T>> result;
  result.reserve(size);
  for (size_t i = 0; i < size; i++) {
    std::vector<T> tmp;
    tmp.resize(fetch_outputs[i].numel());
    memcpy(tmp.data(), fetch_outputs[i].data<T>(),
           fetch_outputs[i].numel() * sizeof(T));
    result.push_back(tmp);
  }

  return result;
}

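// Fixture that builds two programs: init_pdesc_ creates random weights w1/w2
// and fetches them; pdesc_ computes a -> mul(w1) -> mul(w2) and fetches a_out.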
class ExecutorTesterRandom : public ::testing::Test {
 public:
  virtual void SetUp() override {
    int input_dim = 5, batch_size = 2, embed_dim = 5;

    // init pdesc
    auto init_root_block = init_pdesc_.add_blocks();
    init_root_block->set_idx(0);
    init_root_block->set_parent_idx(-1);
    AddOp("gaussian_random", {}, {{"Out", {"w1"}}},
          {{"dims", std::vector<int>{input_dim, embed_dim}}}, init_root_block);
    AddOp("gaussian_random", {}, {{"Out", {"w2"}}},
          {{"dims", std::vector<int>{embed_dim, input_dim}}}, init_root_block);
    AddOp("fetch", {{"Input", {"w1"}}}, {},
          {{"dims", std::vector<int>{input_dim, embed_dim}}}, init_root_block);
    AddOp("fetch", {{"Input", {"w2"}}}, {},
          {{"dims", std::vector<int>{embed_dim, input_dim}}}, init_root_block);

    // run pdesc
    auto root_block = pdesc_.add_blocks();
    root_block->set_idx(0);
    root_block->set_parent_idx(-1);

    add_gaussian_random_op("a", {batch_size, input_dim}, root_block);

    add_mul_op("a", "w1", "b", root_block);
    add_mul_op("b", "w2", "a_out", root_block);

    add_fetch_op("a_out", {input_dim, batch_size}, 0, root_block);
  }

 protected:
  ProgramDesc pdesc_;
  ProgramDesc init_pdesc_;
};

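// Fixture whose program feeds two float vectors ("a" and "b") and fetches
// both back; the tests check that the round trip preserves the values.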
class ExecutorTesterFeedAndFetch : public ::testing::Test {
 public:
  virtual void SetUp() override {
    auto root_block = pdesc_.add_blocks();
    root_block->set_idx(0);
    root_block->set_parent_idx(-1);

    std::vector<int> dim{6};

    add_feed_op("a", dim, 0, root_block);
    add_feed_op("b", dim, 1, root_block);
    add_fetch_op("a", dim, 0, root_block);
    add_fetch_op("b", dim, 1, root_block);

    std::vector<float> vec1 = {1.0, 2.0, 3.0, 4.0, 5.0, 6.0};
    std::vector<float> vec2 = {4.0, 5.0, 6.0, 7.0, 8.0, 9.0};
    inputs_.push_back(vec1);
    inputs_.push_back(vec2);
  }

 protected:
  ProgramDesc pdesc_;
  std::vector<std::vector<float>> inputs_;
};

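// The CPU tests below are compiled when Paddle is built without CUDA;
// otherwise the GPU variants after the #else branch are compiled instead.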
#ifndef PADDLE_WITH_CUDA
TEST_F(ExecutorTesterRandom, CPU) {
  std::vector<Place> places;
  CPUPlace cpu_place;
  places.push_back(cpu_place);

  // We have a global Scope and BuddyAllocator, and we must ensure that the
  // global BuddyAllocator is initialized before the global Scope. Thus, the
  // global Scope will be destructed before the BuddyAllocator. Otherwise, a
  // "pointer being freed was not allocated" error will appear.
  paddle::memory::Used(cpu_place);

  Executor* executor = new Executor(places);
  executor->Run(init_pdesc_, GetGlobalScope());
  executor->Run(pdesc_, GetGlobalScope());
  std::vector<std::vector<float>> result = get_fetch_variable<float>();

  for (auto& vec : result) {
    for (auto& num : vec) {
      std::cout << num << " ";
    }
    std::cout << std::endl;
  }
  delete executor;
}

TEST_F(ExecutorTesterFeedAndFetch, CPU) {
  std::vector<Place> places;
  CPUPlace cpu_place;
  places.push_back(cpu_place);

  // We have a global Scope and BuddyAllocator, and we must ensure that the
  // global BuddyAllocator is initialized before the global Scope. Thus, the
  // global Scope will be destructed before the BuddyAllocator. Otherwise, a
  // "pointer being freed was not allocated" error will appear.
  paddle::memory::Used(cpu_place);

  Executor* executor = new Executor(places);

  // Run 3 mini-batches.
  for (int i = 0; i < 3; i++) {
    set_feed_variable<float>(inputs_);
    executor->Run(pdesc_, GetGlobalScope());
    std::vector<std::vector<float>> result = get_fetch_variable<float>();
    PADDLE_ENFORCE_EQ(result.size(), inputs_.size());
    for (size_t i = 0; i < result.size(); ++i) {
      PADDLE_ENFORCE_EQ(result[i].size(), inputs_[i].size());
      for (size_t j = 0; j < result[i].size(); ++j) {
        PADDLE_ENFORCE_EQ(result[i][j], inputs_[i][j]);
      }
    }
  }

  delete executor;
}
#else
TEST_F(ExecutorTesterRandom, GPU) {
  std::vector<Place> places;
  GPUPlace gpu_place(0);
  places.push_back(gpu_place);

  // We have a global Scope and BuddyAllocator, and we must ensure that the
  // global BuddyAllocator is initialized before the global Scope. Thus, the
  // global Scope will be destructed before the BuddyAllocator. Otherwise, a
  // "pointer being freed was not allocated" error will appear.
  // If paddle is compiled with GPU, both the CPU and GPU BuddyAllocator
  // need to be used first.
  paddle::memory::Used(CPUPlace());
  paddle::memory::Used(gpu_place);

  Executor* executor = new Executor(places);

  LOG(INFO) << "Run Init";
  executor->Run(init_pdesc_, GetGlobalScope());
  LOG(INFO) << "Run";
  executor->Run(pdesc_, GetGlobalScope());
  std::vector<std::vector<float>> result = get_fetch_variable<float>();

  for (auto& vec : result) {
    for (auto& num : vec) {
      std::cout << num << " ";
    }
    std::cout << std::endl;
  }
  delete executor;
}

TEST_F(ExecutorTesterFeedAndFetch, GPU) {
  std::vector<Place> places;
  GPUPlace gpu_place(0);
  places.push_back(gpu_place);
  // We have a global Scope and BuddyAllocator, and we must ensure that the
  // global BuddyAllocator is initialized before the global Scope. Thus, the
  // global Scope will be destructed before the BuddyAllocator. Otherwise, a
  // "pointer being freed was not allocated" error will appear.
  // If paddle is compiled with GPU, both the CPU and GPU BuddyAllocator
  // need to be used first.
  paddle::memory::Used(CPUPlace());
  paddle::memory::Used(gpu_place);

  Executor* executor = new Executor(places);

  // Run 3 mini-batches.
  for (int i = 0; i < 3; i++) {
    set_feed_variable<float>(inputs_);
    executor->Run(pdesc_, GetGlobalScope());
    std::vector<std::vector<float>> result = get_fetch_variable<float>();
    PADDLE_ENFORCE_EQ(result.size(), inputs_.size());
    for (size_t i = 0; i < result.size(); ++i) {
      PADDLE_ENFORCE_EQ(result[i].size(), inputs_[i].size());
      for (size_t j = 0; j < result[i].size(); ++j) {
        PADDLE_ENFORCE_EQ(result[i][j], inputs_[i][j]);
      }
    }
  }
  delete executor;
}
#endif