/** * Copyright 2020 Huawei Technologies Co., Ltd * * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. * You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. */ #include #include #include #include "minddata/dataset/core/client.h" #include "common/common.h" #include "utils/ms_utils.h" #include "gtest/gtest.h" #include "utils/log_adapter.h" #include "minddata/dataset/engine/datasetops/source/csv_op.h" #include "minddata/dataset/util/status.h" namespace common = mindspore::common; using namespace mindspore::dataset; using mindspore::MsLogLevel::INFO; using mindspore::ExceptionType::NoExceptionType; using mindspore::LogStream; class MindDataTestCSVOp : public UT::DatasetOpTesting { }; TEST_F(MindDataTestCSVOp, TestCSVBasic) { // Start with an empty execution tree auto tree = std::make_shared(); std::string dataset_path; dataset_path = datasets_root_path_ + "/testCSV/1.csv"; std::vector> column_default_list; column_default_list.push_back(std::make_shared>(CsvOp::INT, 0)); column_default_list.push_back(std::make_shared>(CsvOp::INT, 0)); column_default_list.push_back(std::make_shared>(CsvOp::INT, 0)); column_default_list.push_back(std::make_shared>(CsvOp::INT, 0)); std::shared_ptr op; CsvOp::Builder builder; builder.SetCsvFilesList({dataset_path}) .SetShuffleFiles(false) .SetOpConnectorSize(2) .SetFieldDelim(',') .SetColumDefault(column_default_list) .SetColumName({"col1", "col2", "col3", "col4"}); Status rc = builder.Build(&op); ASSERT_TRUE(rc.IsOk()); rc = tree->AssociateNode(op); ASSERT_TRUE(rc.IsOk()); rc = tree->AssignRoot(op); ASSERT_TRUE(rc.IsOk()); MS_LOG(INFO) << "Launching tree and begin iteration."; rc = tree->Prepare(); ASSERT_TRUE(rc.IsOk()); rc = tree->Launch(); ASSERT_TRUE(rc.IsOk()); // Start the loop of reading tensors from our pipeline DatasetIterator di(tree); TensorRow tensor_list; rc = di.FetchNextTensorRow(&tensor_list); ASSERT_TRUE(rc.IsOk()); int row_count = 0; while (!tensor_list.empty()) { // Display the tensor by calling the printer on it for (int i = 0; i < tensor_list.size(); i++) { std::ostringstream ss; ss << "(" << tensor_list[i] << "): " << *tensor_list[i] << std::endl; MS_LOG(INFO) << "Tensor print: " << ss.str() << "."; } rc = di.FetchNextTensorRow(&tensor_list); ASSERT_TRUE(rc.IsOk()); row_count++; } ASSERT_EQ(row_count, 3); } TEST_F(MindDataTestCSVOp, TestTotalRows) { std::string csv_file1 = datasets_root_path_ + "/testCSV/1.csv"; std::string csv_file2 = datasets_root_path_ + "/testCSV/size.csv"; std::vector files; files.push_back(csv_file1); int64_t total_rows = 0; CsvOp::CountAllFileRows(files, false, &total_rows); ASSERT_EQ(total_rows, 3); files.clear(); files.push_back(csv_file2); CsvOp::CountAllFileRows(files, false, &total_rows); ASSERT_EQ(total_rows, 5); files.clear(); files.push_back(csv_file1); files.push_back(csv_file2); CsvOp::CountAllFileRows(files, false, &total_rows); ASSERT_EQ(total_rows, 8); files.clear(); }