Paddle/paddle/gserver/tests/test_RecurrentGradientMachi...

/* Copyright (c) 2016 PaddlePaddle Authors. All Rights Reserve.

Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at

    http://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License. */

#include <gtest/gtest.h>
#include <paddle/gserver/gradientmachines/GradientMachine.h>
#include <paddle/trainer/Trainer.h>
#include <paddle/trainer/TrainerInternal.h>
#include <paddle/utils/PythonUtil.h>
#include <paddle/utils/Util.h>
#include <paddle/utils/Version.h>

P_DECLARE_int32(seed);

using namespace paddle;  // NOLINT
using namespace std;     // NOLINT
class TrainerForTest : public paddle::Trainer {
public:
  void startTrain() {
    GradientMachine& gm = *this->trainerInternal_.getGradientMachine();
    gm.start(this->getConfig(), dataProvider_);
  }

  void finishTrain() {
    GradientMachine& gm = *this->trainerInternal_.getGradientMachine();
    gm.finish();
  }

  /**
   * Get total dimension of all parameters.
   *
   * @return the total dimension of all parameters
   */
  size_t getTotalParameterSize() const {
    auto p = const_cast<TrainerForTest*>(this);
    auto& params = p->getGradientMachine()->getParameters();
    return std::accumulate(
        params.begin(), params.end(), 0UL, [](size_t a, const ParameterPtr& p) {
          return a + p->getSize();
        });
  }
};

void CalCost(const string& conf,
             const string& dir,
             real* cost,
             int num_passes) {
  auto config = std::make_shared<TrainerConfigHelper>(conf);
  TrainerForTest trainer;
  trainer.init(config);
  mkDir(dir.c_str());
  config->setSaveDir(dir);
  auto dataProvider = trainer.getDataProvider();
  int32_t batchSize = config->getOptConfig().batch_size();
  real learningRate = config->getOptConfig().learning_rate();
  real momentum = 0;
  real decayRate = 0;
  int64_t dim = trainer.getTotalParameterSize();
  CpuVector vecW(dim);
  CpuVector vecGradient(dim);
  CpuVector vecMomentum(dim);

  // vecW needs to be assigned, otherwise the variable is an uncertain value.

  *ThreadLocalRand::getSeed() = FLAGS_seed;
  vecW.randnorm(0, 0.1);
  vecMomentum.randnorm(0, 0.1);

  trainer.startTrain();
  for (int i = 0; i < num_passes; ++i) {
    real totalCost = 0;
    dataProvider->reset();
    while (true) {
      DataBatch dataBatch;
      int num = dataProvider->getNextBatch(batchSize, &dataBatch);
      if (num == 0) break;
      totalCost += trainer.calcGradient(dataBatch, vecW, vecGradient);
      sgdUpdate(
          learningRate, momentum, decayRate, &vecW, &vecGradient, &vecMomentum);
    }
    cost[i] = totalCost;
  }
  trainer.finishTrain();
  rmDir(dir.c_str());
}

void test(const string& conf1, const string& conf2, double eps, bool useGpu) {
  if (!paddle::version::isWithGpu() && useGpu) {
    return;
  }
  FLAGS_use_gpu = useGpu;
  int num_passes = 5;
  real* cost1 = new real[num_passes];
  const string dir1 = "gserver/tests/t1";
  CalCost(conf1, dir1, cost1, num_passes);

  real* cost2 = new real[num_passes];
  const string dir2 = "gserver/tests/t2";
  CalCost(conf2, dir2, cost2, num_passes);

  for (int i = 0; i < num_passes; i++) {
    LOG(INFO) << "num_passes: " << i << ", cost1=" << cost1[i]
              << ", cost2=" << cost2[i]
              << ", diff=" << std::abs(cost1[i] - cost2[i]);
    ASSERT_NEAR(cost1[i], cost2[i], eps);
  }
  delete[] cost1;
  delete[] cost2;
}

TEST(RecurrentGradientMachine, HasSubSequence) {
  for (bool useGpu : {false, true}) {
    test("gserver/tests/sequence_layer_group.conf",
         "gserver/tests/sequence_nest_layer_group.conf",
         1e-5,
         useGpu);
  }
}

TEST(RecurrentGradientMachine, rnn) {
  for (bool useGpu : {false, true}) {
    test("gserver/tests/sequence_rnn.conf",
         "gserver/tests/sequence_nest_rnn.conf",
         1e-6,
         useGpu);
  }
}

TEST(RecurrentGradientMachine, rnn_multi_input) {
  for (bool useGpu : {false, true}) {
    test("gserver/tests/sequence_rnn_multi_input.conf",
         "gserver/tests/sequence_nest_rnn_multi_input.conf",
         1e-6,
         useGpu);
  }
}

TEST(RecurrentGradientMachine, rnn_multi_unequalength_input) {
  for (bool useGpu : {false, true}) {
    test("gserver/tests/sequence_rnn_multi_unequalength_inputs.py",
         "gserver/tests/sequence_nest_rnn_multi_unequalength_inputs.py",
         1e-6,
         useGpu);
  }
}

int main(int argc, char** argv) {
  if (paddle::version::isWithPyDataProvider()) {
    if (!paddle::version::isWithGpu()) {
      FLAGS_use_gpu = false;
    }
    initMain(argc, argv);
    initPython(argc, argv);
    testing::InitGoogleTest(&argc, argv);
    return RUN_ALL_TESTS();
  } else {
    return 0;
  }
}
Change "Baidu, Inc" into "PaddlePaddle Authors" 8 years ago			`/* Copyright (c) 2016 PaddlePaddle Authors. All Rights Reserve.`
fix dash and space bug, ISSUE=4586495 git-svn-id: https://svn.baidu.com/idl/trunk/paddle@1408 1ad973e4-5ce8-4261-8a94-b56d1f490c56 9 years ago
			`Licensed under the Apache License, Version 2.0 (the "License");`
			`you may not use this file except in compliance with the License.`
			`You may obtain a copy of the License at`

			`http://www.apache.org/licenses/LICENSE-2.0`

			`Unless required by applicable law or agreed to in writing, software`
			`distributed under the License is distributed on an "AS IS" BASIS,`
			`WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.`
			`See the License for the specific language governing permissions and`
			`limitations under the License. */`

			`#include <gtest/gtest.h>`
Format sequence_nest_rnn_multi_unequalength*.conf 8 years ago			`#include <paddle/gserver/gradientmachines/GradientMachine.h>`
fix dash and space bug, ISSUE=4586495 git-svn-id: https://svn.baidu.com/idl/trunk/paddle@1408 1ad973e4-5ce8-4261-8a94-b56d1f490c56 9 years ago			`#include <paddle/trainer/Trainer.h>`
			`#include <paddle/trainer/TrainerInternal.h>`
Format sequence_nest_rnn_multi_unequalength*.conf 8 years ago			`#include <paddle/utils/PythonUtil.h>`
			`#include <paddle/utils/Util.h>`
			`#include <paddle/utils/Version.h>`
fix dash and space bug, ISSUE=4586495 git-svn-id: https://svn.baidu.com/idl/trunk/paddle@1408 1ad973e4-5ce8-4261-8a94-b56d1f490c56 9 years ago
Correctly handle memory in RecurrentGradientMachine for hirarchical RNN Change-Id: I8e0a8ea6fc2760652d9c76440a539c90860062d3 9 years ago			`P_DECLARE_int32(seed);`

fix dash and space bug, ISSUE=4586495 git-svn-id: https://svn.baidu.com/idl/trunk/paddle@1408 1ad973e4-5ce8-4261-8a94-b56d1f490c56 9 years ago			`using namespace paddle; // NOLINT`
hierarchical rnn document, add new config example (#106) * hierarchical rnn document, add new config example * update inputs_type of label * add check for unsupported config * refine hierarchical document * refine doc title * update docs, fix paddle to PaddlePaddle * follow comments 8 years ago			`using namespace std; // NOLINT`
fix dash and space bug, ISSUE=4586495 git-svn-id: https://svn.baidu.com/idl/trunk/paddle@1408 1ad973e4-5ce8-4261-8a94-b56d1f490c56 9 years ago			`class TrainerForTest : public paddle::Trainer {`
			`public:`
			`void startTrain() {`
			`GradientMachine& gm = *this->trainerInternal_.getGradientMachine();`
			`gm.start(this->getConfig(), dataProvider_);`
			`}`

			`void finishTrain() {`
			`GradientMachine& gm = *this->trainerInternal_.getGradientMachine();`
			`gm.finish();`
			`}`

			`/**`
			`* Get total dimension of all parameters.`
			`*`
			`* @return the total dimension of all parameters`
			`*/`
			`size_t getTotalParameterSize() const {`
			`auto p = const_cast<TrainerForTest*>(this);`
hierarchical rnn document, add new config example (#106) * hierarchical rnn document, add new config example * update inputs_type of label * add check for unsupported config * refine hierarchical document * refine doc title * update docs, fix paddle to PaddlePaddle * follow comments 8 years ago			`auto& params = p->getGradientMachine()->getParameters();`
			`return std::accumulate(`
Format sequence_nest_rnn_multi_unequalength*.conf 8 years ago			`params.begin(), params.end(), 0UL, [](size_t a, const ParameterPtr& p) {`
			`return a + p->getSize();`
			`});`
fix dash and space bug, ISSUE=4586495 git-svn-id: https://svn.baidu.com/idl/trunk/paddle@1408 1ad973e4-5ce8-4261-8a94-b56d1f490c56 9 years ago			`}`
			`};`

clang format .cc .h .cpp .c and .hpp file 8 years ago			`void CalCost(const string& conf,`
			`const string& dir,`
			`real* cost,`
fix dash and space bug, ISSUE=4586495 git-svn-id: https://svn.baidu.com/idl/trunk/paddle@1408 1ad973e4-5ce8-4261-8a94-b56d1f490c56 9 years ago			`int num_passes) {`
			`auto config = std::make_shared<TrainerConfigHelper>(conf);`
			`TrainerForTest trainer;`
			`trainer.init(config);`
			`mkDir(dir.c_str());`
			`config->setSaveDir(dir);`
			`auto dataProvider = trainer.getDataProvider();`
			`int32_t batchSize = config->getOptConfig().batch_size();`
			`real learningRate = config->getOptConfig().learning_rate();`
			`real momentum = 0;`
			`real decayRate = 0;`
			`int64_t dim = trainer.getTotalParameterSize();`
			`CpuVector vecW(dim);`
			`CpuVector vecGradient(dim);`
			`CpuVector vecMomentum(dim);`

			`// vecW needs to be assigned, otherwise the variable is an uncertain value.`
Correctly handle memory in RecurrentGradientMachine for hirarchical RNN Change-Id: I8e0a8ea6fc2760652d9c76440a539c90860062d3 9 years ago
			`*ThreadLocalRand::getSeed() = FLAGS_seed;`
			`vecW.randnorm(0, 0.1);`
add interface and test of RecurrentGradientMachine (#156) * add interface and unittest of RecurrentGradientMachine for the function of multiple Subsequence inlinks with unequal token length 8 years ago			`vecMomentum.randnorm(0, 0.1);`
fix dash and space bug, ISSUE=4586495 git-svn-id: https://svn.baidu.com/idl/trunk/paddle@1408 1ad973e4-5ce8-4261-8a94-b56d1f490c56 9 years ago
			`trainer.startTrain();`
			`for (int i = 0; i < num_passes; ++i) {`
			`real totalCost = 0;`
			`dataProvider->reset();`
			`while (true) {`
			`DataBatch dataBatch;`
			`int num = dataProvider->getNextBatch(batchSize, &dataBatch);`
			`if (num == 0) break;`
			`totalCost += trainer.calcGradient(dataBatch, vecW, vecGradient);`
clang format .cc .h .cpp .c and .hpp file 8 years ago			`sgdUpdate(`
			`learningRate, momentum, decayRate, &vecW, &vecGradient, &vecMomentum);`
fix dash and space bug, ISSUE=4586495 git-svn-id: https://svn.baidu.com/idl/trunk/paddle@1408 1ad973e4-5ce8-4261-8a94-b56d1f490c56 9 years ago			`}`
			`cost[i] = totalCost;`
			`}`
			`trainer.finishTrain();`
			`rmDir(dir.c_str());`
			`}`

Correctly handling multiple inputs and integer inputs for recurrent_g… (#114) * Correctly handling multiple inputs and integer inputs for recurrent_group * Fix ScatterAgentLayer for generation * Revert sequence_(nest)_rnn.conf 9 years ago			`void test(const string& conf1, const string& conf2, double eps, bool useGpu) {`
			`if (!paddle::version::isWithGpu() && useGpu) {`
			`return;`
			`}`
			`FLAGS_use_gpu = useGpu;`
fix dash and space bug, ISSUE=4586495 git-svn-id: https://svn.baidu.com/idl/trunk/paddle@1408 1ad973e4-5ce8-4261-8a94-b56d1f490c56 9 years ago			`int num_passes = 5;`
			`real* cost1 = new real[num_passes];`
			`const string dir1 = "gserver/tests/t1";`
			`CalCost(conf1, dir1, cost1, num_passes);`

			`real* cost2 = new real[num_passes];`
			`const string dir2 = "gserver/tests/t2";`
			`CalCost(conf2, dir2, cost2, num_passes);`

			`for (int i = 0; i < num_passes; i++) {`
			`LOG(INFO) << "num_passes: " << i << ", cost1=" << cost1[i]`
Further fix the memory for Hierarchical RNN Sequences should be sorted according to the number of subsequences they have. 9 years ago			`<< ", cost2=" << cost2[i]`
			`<< ", diff=" << std::abs(cost1[i] - cost2[i]);`
			`ASSERT_NEAR(cost1[i], cost2[i], eps);`
fix dash and space bug, ISSUE=4586495 git-svn-id: https://svn.baidu.com/idl/trunk/paddle@1408 1ad973e4-5ce8-4261-8a94-b56d1f490c56 9 years ago			`}`
			`delete[] cost1;`
			`delete[] cost2;`
			`}`

Correctly handle memory in RecurrentGradientMachine for hirarchical RNN Change-Id: I8e0a8ea6fc2760652d9c76440a539c90860062d3 9 years ago			`TEST(RecurrentGradientMachine, HasSubSequence) {`
Correctly handling multiple inputs and integer inputs for recurrent_g… (#114) * Correctly handling multiple inputs and integer inputs for recurrent_group * Fix ScatterAgentLayer for generation * Revert sequence_(nest)_rnn.conf 9 years ago			`for (bool useGpu : {false, true}) {`
			`test("gserver/tests/sequence_layer_group.conf",`
			`"gserver/tests/sequence_nest_layer_group.conf",`
clang format .cc .h .cpp .c and .hpp file 8 years ago			`1e-5,`
			`useGpu);`
Correctly handling multiple inputs and integer inputs for recurrent_g… (#114) * Correctly handling multiple inputs and integer inputs for recurrent_group * Fix ScatterAgentLayer for generation * Revert sequence_(nest)_rnn.conf 9 years ago			`}`
Correctly handle memory in RecurrentGradientMachine for hirarchical RNN Change-Id: I8e0a8ea6fc2760652d9c76440a539c90860062d3 9 years ago			`}`

			`TEST(RecurrentGradientMachine, rnn) {`
Correctly handling multiple inputs and integer inputs for recurrent_g… (#114) * Correctly handling multiple inputs and integer inputs for recurrent_group * Fix ScatterAgentLayer for generation * Revert sequence_(nest)_rnn.conf 9 years ago			`for (bool useGpu : {false, true}) {`
			`test("gserver/tests/sequence_rnn.conf",`
			`"gserver/tests/sequence_nest_rnn.conf",`
clang format .cc .h .cpp .c and .hpp file 8 years ago			`1e-6,`
			`useGpu);`
Correctly handling multiple inputs and integer inputs for recurrent_g… (#114) * Correctly handling multiple inputs and integer inputs for recurrent_group * Fix ScatterAgentLayer for generation * Revert sequence_(nest)_rnn.conf 9 years ago			`}`
Correctly handle memory in RecurrentGradientMachine for hirarchical RNN Change-Id: I8e0a8ea6fc2760652d9c76440a539c90860062d3 9 years ago			`}`

Correctly handling multiple inputs and integer inputs for recurrent_g… (#114) * Correctly handling multiple inputs and integer inputs for recurrent_group * Fix ScatterAgentLayer for generation * Revert sequence_(nest)_rnn.conf 9 years ago			`TEST(RecurrentGradientMachine, rnn_multi_input) {`
			`for (bool useGpu : {false, true}) {`
			`test("gserver/tests/sequence_rnn_multi_input.conf",`
			`"gserver/tests/sequence_nest_rnn_multi_input.conf",`
clang format .cc .h .cpp .c and .hpp file 8 years ago			`1e-6,`
			`useGpu);`
Correctly handling multiple inputs and integer inputs for recurrent_g… (#114) * Correctly handling multiple inputs and integer inputs for recurrent_group * Fix ScatterAgentLayer for generation * Revert sequence_(nest)_rnn.conf 9 years ago			`}`
			`}`
Correctly handle memory in RecurrentGradientMachine for hirarchical RNN Change-Id: I8e0a8ea6fc2760652d9c76440a539c90860062d3 9 years ago
add interface and test of RecurrentGradientMachine (#156) * add interface and unittest of RecurrentGradientMachine for the function of multiple Subsequence inlinks with unequal token length 8 years ago			`TEST(RecurrentGradientMachine, rnn_multi_unequalength_input) {`
clang format .cc .h .cpp .c and .hpp file 8 years ago			`for (bool useGpu : {false, true}) {`
Format sequence_nest_rnn_multi_unequalength*.conf 8 years ago			`test("gserver/tests/sequence_rnn_multi_unequalength_inputs.py",`
			`"gserver/tests/sequence_nest_rnn_multi_unequalength_inputs.py",`
clang format .cc .h .cpp .c and .hpp file 8 years ago			`1e-6,`
			`useGpu);`
			`}`
add interface and test of RecurrentGradientMachine (#156) * add interface and unittest of RecurrentGradientMachine for the function of multiple Subsequence inlinks with unequal token length 8 years ago			`}`

fix dash and space bug, ISSUE=4586495 git-svn-id: https://svn.baidu.com/idl/trunk/paddle@1408 1ad973e4-5ce8-4261-8a94-b56d1f490c56 9 years ago			`int main(int argc, char** argv) {`
			`if (paddle::version::isWithPyDataProvider()) {`
			`if (!paddle::version::isWithGpu()) {`
			`FLAGS_use_gpu = false;`
			`}`
			`initMain(argc, argv);`
			`initPython(argc, argv);`
			`testing::InitGoogleTest(&argc, argv);`
			`return RUN_ALL_TESTS();`
			`} else {`
			`return 0;`
			`}`
			`}`