You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
96 lines
3.5 KiB
96 lines
3.5 KiB
/* Copyright (c) 2018 PaddlePaddle Authors. All Rights Reserved.
|
|
|
|
Licensed under the Apache License, Version 2.0 (the "License");
|
|
you may not use this file except in compliance with the License.
|
|
You may obtain a copy of the License at
|
|
|
|
http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
Unless required by applicable law or agreed to in writing, software
|
|
distributed under the License is distributed on an "AS IS" BASIS,
|
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
See the License for the specific language governing permissions and
|
|
limitations under the License. */
|
|
|
|
#pragma once
|
|
|
|
#include <stdint.h>
|
|
#include <fstream>
|
|
#include <numeric>
|
|
#include <sstream>
|
|
#include <string>
|
|
|
|
#include "paddle/fluid/framework/data_type.h"
|
|
#include "paddle/fluid/framework/data_type_transform.h"
|
|
#include "paddle/fluid/framework/framework.pb.h"
|
|
#include "paddle/fluid/framework/lod_tensor.h"
|
|
#include "paddle/fluid/framework/op_registry.h"
|
|
#include "paddle/fluid/platform/device_context.h"
|
|
#include "paddle/fluid/platform/port.h"
|
|
|
|
namespace paddle {
|
|
namespace operators {
|
|
template <typename DeviceContext, typename T>
|
|
class SaveCombineOpKernel : public framework::OpKernel<T> {
|
|
public:
|
|
void Compute(const framework::ExecutionContext &ctx) const override {
|
|
auto place = ctx.GetPlace();
|
|
auto filename = ctx.Attr<std::string>("file_path");
|
|
auto overwrite = ctx.Attr<bool>("overwrite");
|
|
auto save_as_fp16 = ctx.Attr<bool>("save_as_fp16");
|
|
|
|
bool is_present = FileExists(filename);
|
|
if (is_present && !overwrite) {
|
|
PADDLE_THROW("%s exists!, cannot save_combine to it when overwrite=false",
|
|
filename, overwrite);
|
|
}
|
|
|
|
MkDirRecursively(DirName(filename).c_str());
|
|
std::ofstream fout(filename, std::ios::binary);
|
|
PADDLE_ENFORCE(static_cast<bool>(fout), "Cannot open %s to write",
|
|
filename);
|
|
|
|
auto &inp_var_names = ctx.Inputs("X");
|
|
auto &inp_vars = ctx.MultiInputVar("X");
|
|
PADDLE_ENFORCE_GT(static_cast<int>(inp_var_names.size()), 0,
|
|
"The number of input variables should be greater than 0");
|
|
|
|
// get device context from pool
|
|
platform::DeviceContextPool &pool = platform::DeviceContextPool::Instance();
|
|
auto &dev_ctx = *pool.Get(place);
|
|
|
|
for (size_t i = 0; i < inp_var_names.size(); i++) {
|
|
PADDLE_ENFORCE(inp_vars[i] != nullptr,
|
|
"Cannot find variable %s for save_combine_op",
|
|
inp_var_names[i]);
|
|
PADDLE_ENFORCE(inp_vars[i]->IsType<framework::LoDTensor>(),
|
|
"SaveCombineOp only supports LoDTensor, %s has wrong type",
|
|
inp_var_names[i]);
|
|
|
|
auto &tensor = inp_vars[i]->Get<framework::LoDTensor>();
|
|
// Serialize tensors one by one
|
|
|
|
// Check types to see if a fp16 transformation is required
|
|
auto in_dtype = tensor.type();
|
|
auto out_dtype =
|
|
save_as_fp16 ? framework::proto::VarType::FP16 : in_dtype;
|
|
|
|
if (in_dtype != out_dtype) {
|
|
auto in_kernel_type = framework::OpKernelType(in_dtype, place);
|
|
auto out_kernel_type = framework::OpKernelType(out_dtype, place);
|
|
framework::LoDTensor out;
|
|
// copy LoD info to the new tensor
|
|
out.set_lod(tensor.lod());
|
|
framework::TransDataType(in_kernel_type, out_kernel_type, tensor, &out);
|
|
framework::SerializeToStream(fout, out, dev_ctx);
|
|
} else {
|
|
framework::SerializeToStream(fout, tensor, dev_ctx);
|
|
}
|
|
}
|
|
fout.close();
|
|
}
|
|
};
|
|
|
|
} // namespace operators
|
|
} // namespace paddle
|