Paddle/paddle/fluid/inference/tests/api/analyzer_ner_tester.cc

// Copyright (c) 2018 PaddlePaddle Authors. All Rights Reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

#include "paddle/fluid/inference/tests/api/tester_helper.h"

namespace paddle {
namespace inference {
using contrib::AnalysisConfig;

struct DataRecord {
  std::vector<std::vector<int64_t>> word_data_all, mention_data_all;
  std::vector<size_t> lod;  // two inputs have the same lod info.
  size_t batch_iter{0};
  size_t batch_size{1};
  size_t num_samples;  // total number of samples
  DataRecord() = default;
  explicit DataRecord(const std::string &path, int batch_size = 1)
      : batch_size(batch_size) {
    Load(path);
  }
  DataRecord NextBatch() {
    DataRecord data;
    size_t batch_end = batch_iter + batch_size;
    // NOTE skip the final batch, if no enough data is provided.
    if (batch_end <= word_data_all.size()) {
      data.word_data_all.assign(word_data_all.begin() + batch_iter,
                                word_data_all.begin() + batch_end);
      data.mention_data_all.assign(mention_data_all.begin() + batch_iter,
                                   mention_data_all.begin() + batch_end);
      // Prepare LoDs
      data.lod.push_back(0);
      CHECK(!data.word_data_all.empty());
      CHECK(!data.mention_data_all.empty());
      CHECK_EQ(data.word_data_all.size(), data.mention_data_all.size());
      for (size_t j = 0; j < data.word_data_all.size(); j++) {
        // calculate lod
        data.lod.push_back(data.lod.back() + data.word_data_all[j].size());
      }
    }
    batch_iter += batch_size;
    return data;
  }
  void Load(const std::string &path) {
    std::ifstream file(path);
    std::string line;
    int num_lines = 0;
    while (std::getline(file, line)) {
      num_lines++;
      std::vector<std::string> data;
      split(line, ';', &data);
      // load word data
      std::vector<int64_t> word_data;
      split_to_int64(data[1], ' ', &word_data);
      // load mention data
      std::vector<int64_t> mention_data;
      split_to_int64(data[3], ' ', &mention_data);
      word_data_all.push_back(std::move(word_data));
      mention_data_all.push_back(std::move(mention_data));
    }
    num_samples = num_lines;
  }
};

void PrepareInputs(std::vector<PaddleTensor> *input_slots, DataRecord *data,
                   int batch_size) {
  PaddleTensor lod_word_tensor, lod_mention_tensor;
  lod_word_tensor.name = "word";
  lod_mention_tensor.name = "mention";
  auto one_batch = data->NextBatch();
  int size = one_batch.lod[one_batch.lod.size() - 1];  // token batch size
  lod_word_tensor.shape.assign({size, 1});
  lod_word_tensor.lod.assign({one_batch.lod});
  lod_mention_tensor.shape.assign({size, 1});
  lod_mention_tensor.lod.assign({one_batch.lod});
  // assign data
  TensorAssignData<int64_t>(&lod_word_tensor, one_batch.word_data_all);
  TensorAssignData<int64_t>(&lod_mention_tensor, one_batch.mention_data_all);
  // Set inputs.
  input_slots->assign({lod_word_tensor, lod_mention_tensor});
  for (auto &tensor : *input_slots) {
    tensor.dtype = PaddleDType::INT64;
  }
}

// Fills `cfg` for the NER model found under FLAGS_infer_model.
//
// memory_load == false: the config is pointed at the "__model__" and "param"
//                       files on disk.
// memory_load == true:  both files are read into strings and handed to the
//                       config through SetModelBuffer().
//
// In either case the config is set to CPU (use_gpu = false, device 0), with
// named inputs and IR optimisation enabled.
void SetConfig(contrib::AnalysisConfig *cfg, bool memory_load = false) {
  const std::string prog_path = FLAGS_infer_model + "/__model__";
  const std::string param_path = FLAGS_infer_model + "/param";

  if (!memory_load) {
    cfg->prog_file = prog_path;
    cfg->param_file = param_path;
  } else {
    std::string prog_bytes;
    std::string param_bytes;
    ReadBinaryFile(prog_path, &prog_bytes);
    ReadBinaryFile(param_path, &param_bytes);
    cfg->SetModelBuffer(&prog_bytes[0], prog_bytes.size(), &param_bytes[0],
                        param_bytes.size());
  }

  cfg->use_gpu = false;
  cfg->device = 0;
  cfg->specify_input_name = true;
  cfg->enable_ir_optim = true;
}

void SetInput(std::vector<std::vector<PaddleTensor>> *inputs) {
  DataRecord data(FLAGS_infer_data, FLAGS_batch_size);
  std::vector<PaddleTensor> input_slots;
  int epoch = FLAGS_test_all_data ? data.num_samples / FLAGS_batch_size : 1;
  LOG(INFO) << "number of samples: " << epoch * FLAGS_batch_size;
  for (int bid = 0; bid < epoch; ++bid) {
    PrepareInputs(&input_slots, &data, FLAGS_batch_size);
    (*inputs).emplace_back(input_slots);
  }
}

// Easy for profiling independently.
//
// Configures the predictor (from files, or from in-memory buffers when
// `memory_load` is true), builds the inputs and runs TestPrediction with
// FLAGS_num_threads threads.
//
// When running single-threaded on the first batch only, the leading output
// values are additionally compared against the recorded reference result.
void profile(bool memory_load = false) {
  contrib::AnalysisConfig cfg;
  SetConfig(&cfg, memory_load);
  std::vector<PaddleTensor> outputs;

  std::vector<std::vector<PaddleTensor>> input_slots_all;
  SetInput(&input_slots_all);
  TestPrediction(reinterpret_cast<const PaddlePredictor::Config *>(&cfg),
                 input_slots_all, &outputs, FLAGS_num_threads);

  if (FLAGS_num_threads != 1 || FLAGS_test_all_data) {
    return;
  }

  // the first inference result
  const int64_t chinese_ner_result_data[] = {30, 45, 41, 48, 17, 26,
                                             48, 39, 38, 16, 25};
  // Derived from the array so the loop bound cannot drift from the data.
  const size_t num_expected =
      sizeof(chinese_ner_result_data) / sizeof(chinese_ner_result_data[0]);

  PADDLE_ENFORCE_EQ(outputs.size(), 1UL);
  const size_t size = GetSize(outputs[0]);
  PADDLE_ENFORCE_GT(size, 0UL);
  const int64_t *result = static_cast<int64_t *>(outputs[0].data.data());
  // Explicit template argument: both operands become size_t regardless of
  // how the platform defines it, so the call always resolves.
  const size_t num_checked = std::min<size_t>(num_expected, size);
  for (size_t i = 0; i < num_checked; i++) {
    EXPECT_EQ(result[i], chinese_ner_result_data[i]);
  }
}

// Profile with the model loaded from the files on disk.
TEST(Analyzer_Chinese_ner, profile) {
  profile(false /* memory_load */);
}

// Profile with the model handed to the config through in-memory buffers.
TEST(Analyzer_Chinese_ner, profile_memory_load) {
  const bool memory_load = true;
  profile(memory_load);
}

// Check the fuse status: the analysis pass is expected to report one
// "fc_fuse", two "fc_gru_fuse" and 14 ops in total for this model.
TEST(Analyzer_Chinese_ner, fuse_statis) {
  contrib::AnalysisConfig cfg;
  SetConfig(&cfg);

  auto predictor = CreatePaddlePredictor<AnalysisConfig>(cfg);
  // Fail the test cleanly instead of passing a null predictor on to
  // GetFuseStatis() should predictor creation not succeed.
  ASSERT_TRUE(predictor != nullptr);

  // Written by GetFuseStatis(); initialised so a failure message never shows
  // an indeterminate value.
  int num_ops = 0;
  auto fuse_statis = GetFuseStatis(
      static_cast<AnalysisPredictor *>(predictor.get()), &num_ops);
  // ASSERT (not EXPECT) so that the .at() lookups below cannot throw.
  ASSERT_TRUE(fuse_statis.count("fc_fuse"));
  ASSERT_TRUE(fuse_statis.count("fc_gru_fuse"));
  EXPECT_EQ(fuse_statis.at("fc_fuse"), 1);
  EXPECT_EQ(fuse_statis.at("fc_gru_fuse"), 2);
  EXPECT_EQ(num_ops, 14);
}

// Feed the same inputs through CompareNativeAndAnalysis to compare the
// result of NativeConfig and AnalysisConfig.
TEST(Analyzer_Chinese_ner, compare) {
  AnalysisConfig analysis_cfg;
  SetConfig(&analysis_cfg);

  std::vector<std::vector<PaddleTensor>> all_inputs;
  SetInput(&all_inputs);

  // The helper takes the config through the generic base-config pointer.
  const auto *base_cfg =
      reinterpret_cast<const PaddlePredictor::Config *>(&analysis_cfg);
  CompareNativeAndAnalysis(base_cfg, all_inputs);
}

// Feed the inputs through CompareDeterministic to compare the deterministic
// result.
TEST(Analyzer_Chinese_ner, compare_determine) {
  contrib::AnalysisConfig analysis_cfg;
  SetConfig(&analysis_cfg);

  std::vector<std::vector<PaddleTensor>> all_inputs;
  SetInput(&all_inputs);

  // The helper takes the config through the generic base-config pointer.
  const auto *base_cfg =
      reinterpret_cast<const PaddlePredictor::Config *>(&analysis_cfg);
  CompareDeterministic(base_cfg, all_inputs);
}

}  // namespace inference
}  // namespace paddle
add unit-test for chinese_ner 7 years ago			`// Copyright (c) 2018 PaddlePaddle Authors. All Rights Reserved.`
			`//`
			`// Licensed under the Apache License, Version 2.0 (the "License");`
			`// you may not use this file except in compliance with the License.`
			`// You may obtain a copy of the License at`
			`//`
			`// http://www.apache.org/licenses/LICENSE-2.0`
			`//`
			`// Unless required by applicable law or agreed to in writing, software`
			`// distributed under the License is distributed on an "AS IS" BASIS,`
			`// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.`
			`// See the License for the specific language governing permissions and`
			`// limitations under the License.`

add multi-thread for nlp unit-tests 7 years ago			`#include "paddle/fluid/inference/tests/api/tester_helper.h"`
add unit-test for chinese_ner 7 years ago
			`namespace paddle {`
			`namespace inference {`
fea/infer executor and concurrency performance issue bug fix (#13451) - add naive executor - fix concurrency performance issue 6 years ago			`using contrib::AnalysisConfig;`
add unit-test for chinese_ner 7 years ago
			`struct DataRecord {`
			`std::vector<std::vector<int64_t>> word_data_all, mention_data_all;`
			`std::vector<size_t> lod; // two inputs have the same lod info.`
			`size_t batch_iter{0};`
			`size_t batch_size{1};`
add test_all_data in test_analyzer_ner 7 years ago			`size_t num_samples; // total number of samples`
add unit-test for chinese_ner 7 years ago			`DataRecord() = default;`
			`explicit DataRecord(const std::string &path, int batch_size = 1)`
			`: batch_size(batch_size) {`
			`Load(path);`
			`}`
			`DataRecord NextBatch() {`
			`DataRecord data;`
			`size_t batch_end = batch_iter + batch_size;`
			`// NOTE skip the final batch, if no enough data is provided.`
			`if (batch_end <= word_data_all.size()) {`
			`data.word_data_all.assign(word_data_all.begin() + batch_iter,`
			`word_data_all.begin() + batch_end);`
			`data.mention_data_all.assign(mention_data_all.begin() + batch_iter,`
			`mention_data_all.begin() + batch_end);`
			`// Prepare LoDs`
			`data.lod.push_back(0);`
			`CHECK(!data.word_data_all.empty());`
			`CHECK(!data.mention_data_all.empty());`
			`CHECK_EQ(data.word_data_all.size(), data.mention_data_all.size());`
			`for (size_t j = 0; j < data.word_data_all.size(); j++) {`
			`// calculate lod`
			`data.lod.push_back(data.lod.back() + data.word_data_all[j].size());`
			`}`
			`}`
			`batch_iter += batch_size;`
			`return data;`
			`}`
			`void Load(const std::string &path) {`
			`std::ifstream file(path);`
			`std::string line;`
			`int num_lines = 0;`
			`while (std::getline(file, line)) {`
			`num_lines++;`
			`std::vector<std::string> data;`
			`split(line, ';', &data);`
			`// load word data`
			`std::vector<int64_t> word_data;`
			`split_to_int64(data[1], ' ', &word_data);`
			`// load mention data`
			`std::vector<int64_t> mention_data;`
			`split_to_int64(data[3], ' ', &mention_data);`
			`word_data_all.push_back(std::move(word_data));`
			`mention_data_all.push_back(std::move(mention_data));`
			`}`
add test_all_data in test_analyzer_ner 7 years ago			`num_samples = num_lines;`
add unit-test for chinese_ner 7 years ago			`}`
			`};`

			`void PrepareInputs(std::vector<PaddleTensor> *input_slots, DataRecord *data,`
			`int batch_size) {`
			`PaddleTensor lod_word_tensor, lod_mention_tensor;`
			`lod_word_tensor.name = "word";`
			`lod_mention_tensor.name = "mention";`
			`auto one_batch = data->NextBatch();`
			`int size = one_batch.lod[one_batch.lod.size() - 1]; // token batch size`
			`lod_word_tensor.shape.assign({size, 1});`
			`lod_word_tensor.lod.assign({one_batch.lod});`
			`lod_mention_tensor.shape.assign({size, 1});`
			`lod_mention_tensor.lod.assign({one_batch.lod});`
			`// assign data`
Nlp dam (#14248) * add dam test * update fuse_statis * use separated dam model. * Revert "use separated dam model." This reverts commit 13e775c86f909b164b7cc1d35a8a24b964ec622e. * test=develop * modify the cmake file about infer test, test=develop. * remove one comment, test=develop. 6 years ago			`TensorAssignData<int64_t>(&lod_word_tensor, one_batch.word_data_all);`
			`TensorAssignData<int64_t>(&lod_mention_tensor, one_batch.mention_data_all);`
add unit-test for chinese_ner 7 years ago			`// Set inputs.`
			`input_slots->assign({lod_word_tensor, lod_mention_tensor});`
			`for (auto &tensor : *input_slots) {`
			`tensor.dtype = PaddleDType::INT64;`
			`}`
			`}`

support loading from memory test=develop 6 years ago			`void SetConfig(contrib::AnalysisConfig *cfg, bool memory_load = false) {`
			`if (memory_load) {`
			`std::string buffer_prog, buffer_param;`
			`ReadBinaryFile(FLAGS_infer_model + "/__model__", &buffer_prog);`
			`ReadBinaryFile(FLAGS_infer_model + "/param", &buffer_param);`
update with comments test=develop 6 years ago			`cfg->SetModelBuffer(&buffer_prog[0], buffer_prog.size(), &buffer_param[0],`
			`buffer_param.size());`
support loading from memory test=develop 6 years ago			`} else {`
			`cfg->prog_file = FLAGS_infer_model + "/__model__";`
			`cfg->param_file = FLAGS_infer_model + "/param";`
			`}`
Refine infer api test (#13472) * refine analyzer_nlp_tester * refine analyzer_rnn/vis_tester 7 years ago			`cfg->use_gpu = false;`
			`cfg->device = 0;`
			`cfg->specify_input_name = true;`
			`cfg->enable_ir_optim = true;`
			`}`
add test_all_data in test_analyzer_ner 7 years ago
Refine infer api test (#13472) * refine analyzer_nlp_tester * refine analyzer_rnn/vis_tester 7 years ago			`void SetInput(std::vector<std::vector<PaddleTensor>> *inputs) {`
add test_all_data in test_analyzer_ner 7 years ago			`DataRecord data(FLAGS_infer_data, FLAGS_batch_size);`
Refine infer api test (#13472) * refine analyzer_nlp_tester * refine analyzer_rnn/vis_tester 7 years ago			`std::vector<PaddleTensor> input_slots;`
			`int epoch = FLAGS_test_all_data ? data.num_samples / FLAGS_batch_size : 1;`
			`LOG(INFO) << "number of samples: " << epoch * FLAGS_batch_size;`
			`for (int bid = 0; bid < epoch; ++bid) {`
			`PrepareInputs(&input_slots, &data, FLAGS_batch_size);`
			`(*inputs).emplace_back(input_slots);`
add unit-test for chinese_ner 7 years ago			`}`
Refine infer api test (#13472) * refine analyzer_nlp_tester * refine analyzer_rnn/vis_tester 7 years ago			`}`
add unit-test for chinese_ner 7 years ago
Refine infer api test (#13472) * refine analyzer_nlp_tester * refine analyzer_rnn/vis_tester 7 years ago			`// Easy for profiling independently.`
support loading from memory test=develop 6 years ago			`void profile(bool memory_load = false) {`
refine inference api (#13518) 7 years ago			`contrib::AnalysisConfig cfg;`
support loading from memory test=develop 6 years ago			`SetConfig(&cfg, memory_load);`
Refine infer api test (#13472) * refine analyzer_nlp_tester * refine analyzer_rnn/vis_tester 7 years ago			`std::vector<PaddleTensor> outputs;`
enable ner analysis test and refine lac 7 years ago
Refine infer api test (#13472) * refine analyzer_nlp_tester * refine analyzer_rnn/vis_tester 7 years ago			`std::vector<std::vector<PaddleTensor>> input_slots_all;`
			`SetInput(&input_slots_all);`
Refine tester of TensorRT engine (#14390) * Refine the tester for MixedRTPredictor. test=develop * Enable the profiler in TensorRT engine. * Support the use of combined inference model in TensorRT unittest, and print the shape of feed targets. 6 years ago			`TestPrediction(reinterpret_cast<const PaddlePredictor::Config *>(&cfg),`
			`input_slots_all, &outputs, FLAGS_num_threads);`
enable ner analysis test and refine lac 7 years ago
Refine infer api test (#13472) * refine analyzer_nlp_tester * refine analyzer_rnn/vis_tester 7 years ago			`if (FLAGS_num_threads == 1 && !FLAGS_test_all_data) {`
			`// the first inference result`
			`const int chinese_ner_result_data[] = {30, 45, 41, 48, 17, 26,`
			`48, 39, 38, 16, 25};`
			`PADDLE_ENFORCE_EQ(outputs.size(), 1UL);`
			`size_t size = GetSize(outputs[0]);`
			`PADDLE_ENFORCE_GT(size, 0);`
			`int64_t *result = static_cast<int64_t *>(outputs[0].data.data());`
			`for (size_t i = 0; i < std::min(11UL, size); i++) {`
			`EXPECT_EQ(result[i], chinese_ner_result_data[i]);`
enable ner analysis test and refine lac 7 years ago			`}`
			`}`
add unit-test for chinese_ner 7 years ago			`}`

support loading from memory test=develop 6 years ago			`TEST(Analyzer_Chinese_ner, profile) { profile(); }`

			`TEST(Analyzer_Chinese_ner, profile_memory_load) {`
			`profile(true /* memory_load */);`
			`}`

Refine infer api test (#13472) * refine analyzer_nlp_tester * refine analyzer_rnn/vis_tester 7 years ago			`// Check the fuse status`
			`TEST(Analyzer_Chinese_ner, fuse_statis) {`
refine inference api (#13518) 7 years ago			`contrib::AnalysisConfig cfg;`
Refine infer api test (#13472) * refine analyzer_nlp_tester * refine analyzer_rnn/vis_tester 7 years ago			`SetConfig(&cfg);`
enable ner analysis test and refine lac 7 years ago
Refine infer api test (#13472) * refine analyzer_nlp_tester * refine analyzer_rnn/vis_tester 7 years ago			`int num_ops;`
fea/infer executor and concurrency performance issue bug fix (#13451) - add naive executor - fix concurrency performance issue 6 years ago			`auto predictor = CreatePaddlePredictor<AnalysisConfig>(cfg);`
			`auto fuse_statis = GetFuseStatis(`
			`static_cast<AnalysisPredictor *>(predictor.get()), &num_ops);`
Refine infer api test (#13472) * refine analyzer_nlp_tester * refine analyzer_rnn/vis_tester 7 years ago			`ASSERT_TRUE(fuse_statis.count("fc_fuse"));`
			`ASSERT_TRUE(fuse_statis.count("fc_gru_fuse"));`
			`EXPECT_EQ(fuse_statis.at("fc_fuse"), 1);`
			`EXPECT_EQ(fuse_statis.at("fc_gru_fuse"), 2);`
			`EXPECT_EQ(num_ops, 14);`
			`}`

			`// Compare result of NativeConfig and AnalysisConfig`
			`TEST(Analyzer_Chinese_ner, compare) {`
refine inference api (#13518) 7 years ago			`contrib::AnalysisConfig cfg;`
Refine infer api test (#13472) * refine analyzer_nlp_tester * refine analyzer_rnn/vis_tester 7 years ago			`SetConfig(&cfg);`

			`std::vector<std::vector<PaddleTensor>> input_slots_all;`
			`SetInput(&input_slots_all);`
Refine tester of TensorRT engine (#14390) * Refine the tester for MixedRTPredictor. test=develop * Enable the profiler in TensorRT engine. * Support the use of combined inference model in TensorRT unittest, and print the shape of feed targets. 6 years ago			`CompareNativeAndAnalysis(`
			`reinterpret_cast<const PaddlePredictor::Config *>(&cfg), input_slots_all);`
Refine infer api test (#13472) * refine analyzer_nlp_tester * refine analyzer_rnn/vis_tester 7 years ago			`}`
add unit-test for chinese_ner 7 years ago
add deterministic result unit-test test=develop 6 years ago			`// Compare Deterministic result`
			`TEST(Analyzer_Chinese_ner, compare_determine) {`
			`AnalysisConfig cfg;`
			`SetConfig(&cfg);`

			`std::vector<std::vector<PaddleTensor>> input_slots_all;`
			`SetInput(&input_slots_all);`
			`CompareDeterministic(reinterpret_cast<const PaddlePredictor::Config *>(&cfg),`
			`input_slots_all);`
			`}`

add unit-test for chinese_ner 7 years ago			`} // namespace inference`
			`} // namespace paddle`