/** * Copyright 2020 Huawei Technologies Co., Ltd * * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. * You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. */ #include #include #include #include "dataset/core/client.h" #include "common/common.h" #include "common/utils.h" #include "gtest/gtest.h" #include "utils/log_adapter.h" #include "dataset/engine/datasetops/source/text_file_op.h" #include "dataset/util/status.h" namespace common = mindspore::common; using namespace mindspore::dataset; using mindspore::MsLogLevel::INFO; using mindspore::ExceptionType::NoExceptionType; using mindspore::LogStream; class MindDataTestTextFileOp : public UT::DatasetOpTesting { }; TEST_F(MindDataTestTextFileOp, TestTextFileBasic) { // Start with an empty execution tree auto tree = std::make_shared(); std::string dataset_path; dataset_path = datasets_root_path_ + "/testTextFileDataset/1.txt"; std::shared_ptr op; TextFileOp::Builder builder; builder.SetTextFilesList({dataset_path}) .SetRowsPerBuffer(16) .SetNumWorkers(16) .SetOpConnectorSize(2); Status rc = builder.Build(&op); ASSERT_TRUE(rc.IsOk()); rc = tree->AssociateNode(op); ASSERT_TRUE(rc.IsOk()); rc = tree->AssignRoot(op); ASSERT_TRUE(rc.IsOk()); MS_LOG(INFO) << "Launching tree and begin iteration."; rc = tree->Prepare(); ASSERT_TRUE(rc.IsOk()); rc = tree->Launch(); ASSERT_TRUE(rc.IsOk()); // Start the loop of reading tensors from our pipeline DatasetIterator di(tree); TensorRow tensor_list; rc = di.FetchNextTensorRow(&tensor_list); ASSERT_TRUE(rc.IsOk()); int row_count = 0; while (!tensor_list.empty()) { // Display the tensor by calling the printer on it for (int i = 0; i < tensor_list.size(); i++) { std::ostringstream ss; ss << "(" << tensor_list[i] << "): " << *tensor_list[i] << std::endl; MS_LOG(INFO) << "Tensor print: " << ss.str() << "."; } rc = di.FetchNextTensorRow(&tensor_list); ASSERT_TRUE(rc.IsOk()); row_count++; } ASSERT_EQ(row_count, 3); } TEST_F(MindDataTestTextFileOp, TestTotalRows) { std::string tf_file1 = datasets_root_path_ + "/testTextFileDataset/1.txt"; std::string tf_file2 = datasets_root_path_ + "/testTextFileDataset/2.txt"; std::vector files; files.push_back(tf_file1); int64_t total_rows = 0; TextFileOp::CountAllFileRows(files, &total_rows); ASSERT_EQ(total_rows, 3); files.clear(); files.push_back(tf_file2); TextFileOp::CountAllFileRows(files, &total_rows); ASSERT_EQ(total_rows, 2); files.clear(); files.push_back(tf_file1); files.push_back(tf_file2); TextFileOp::CountAllFileRows(files, &total_rows); ASSERT_EQ(total_rows, 5); files.clear(); }