You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
62 lines
2.3 KiB
62 lines
2.3 KiB
// Copyright (c) 2018 PaddlePaddle Authors. All Rights Reserved.
|
|
//
|
|
// Licensed under the Apache License, Version 2.0 (the "License");
|
|
// you may not use this file except in compliance with the License.
|
|
// You may obtain a copy of the License at
|
|
//
|
|
// http://www.apache.org/licenses/LICENSE-2.0
|
|
//
|
|
// Unless required by applicable law or agreed to in writing, software
|
|
// distributed under the License is distributed on an "AS IS" BASIS,
|
|
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
// See the License for the specific language governing permissions and
|
|
// limitations under the License.
|
|
|
|
#include "paddle/fluid/operators/impl/load_combine.h"
|
|
|
|
namespace paddle {
|
|
namespace operators {
|
|
namespace impl {
|
|
|
|
void LoadParamsFromStream(const std::vector<std::string> &out_var_names,
|
|
const paddle::platform::Place &place,
|
|
bool load_as_fp16, std::istream *buffer,
|
|
const paddle::framework::Scope *scope) {
|
|
auto *dev_ctx = platform::DeviceContextPool::Instance().Get(place);
|
|
for (size_t i = 0; i < out_var_names.size(); i++) {
|
|
auto *out_var = scope->FindVar(out_var_names[i]);
|
|
|
|
PADDLE_ENFORCE(out_var != nullptr, "Output variable %s cannot be found",
|
|
out_var_names[i]);
|
|
|
|
auto *tensor = out_var->GetMutable<framework::LoDTensor>();
|
|
|
|
// Get data from fin to tensor
|
|
DeserializeFromStream(*buffer, tensor, *dev_ctx);
|
|
|
|
auto in_dtype = framework::ToDataType(tensor->type());
|
|
auto out_dtype = load_as_fp16 ? framework::proto::VarType::FP16 : in_dtype;
|
|
|
|
if (in_dtype != out_dtype) {
|
|
// convert to float16 tensor
|
|
auto in_kernel_type = framework::OpKernelType(in_dtype, place);
|
|
auto out_kernel_type = framework::OpKernelType(out_dtype, place);
|
|
framework::LoDTensor fp16_tensor;
|
|
// copy LoD info to the new tensor
|
|
fp16_tensor.set_lod(tensor->lod());
|
|
framework::TransDataType(in_kernel_type, out_kernel_type, *tensor,
|
|
&fp16_tensor);
|
|
|
|
// reset output tensor
|
|
out_var->Clear();
|
|
tensor = out_var->GetMutable<framework::LoDTensor>();
|
|
tensor->set_lod(fp16_tensor.lod());
|
|
tensor->ShareDataWith(fp16_tensor);
|
|
}
|
|
}
|
|
}
|
|
|
|
} // namespace impl
|
|
} // namespace operators
|
|
} // namespace paddle
|