parent
316765839d
commit
9da7b33515
@ -1,106 +1 @@
|
||||
/* Copyright (c) 2016 PaddlePaddle Authors. All Rights Reserved.
|
||||
|
||||
Licensed under the Apache License, Version 2.0 (the "License");
|
||||
you may not use this file except in compliance with the License.
|
||||
You may obtain a copy of the License at
|
||||
|
||||
http://www.apache.org/licenses/LICENSE-2.0
|
||||
|
||||
Unless required by applicable law or agreed to in writing, software
|
||||
distributed under the License is distributed on an "AS IS" BASIS,
|
||||
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
See the License for the specific language governing permissions and
|
||||
limitations under the License. */
|
||||
|
||||
#include "paddle/fluid/framework/data_type_transform.h"
|
||||
|
||||
#include "paddle/fluid/framework/selected_rows.h"
|
||||
#include "paddle/fluid/platform/transform.h"
|
||||
|
||||
namespace paddle {
|
||||
namespace framework {
|
||||
|
||||
template <typename InType, typename OutType>
|
||||
struct CastDataTypeFunctor {
|
||||
HOSTDEVICE inline OutType operator()(InType in) const {
|
||||
return static_cast<OutType>(in);
|
||||
}
|
||||
};
|
||||
|
||||
template <typename InType>
|
||||
struct CastDataType {
|
||||
CastDataType(const framework::Tensor& in, framework::Tensor* out,
|
||||
const platform::DeviceContext* ctx)
|
||||
: in_(in), out_(out), ctx_(ctx) {}
|
||||
const framework::Tensor in_;
|
||||
framework::Tensor* out_;
|
||||
const platform::DeviceContext* ctx_;
|
||||
|
||||
template <typename OutType>
|
||||
void apply() {
|
||||
auto* in_begin = in_.data<InType>();
|
||||
auto* in_end = in_begin + in_.numel();
|
||||
auto* out_begin = out_->mutable_data<OutType>(in_.place());
|
||||
|
||||
if (platform::is_cpu_place(in_.place())) {
|
||||
platform::Transform<platform::CPUDeviceContext> trans;
|
||||
auto* context = static_cast<const platform::CPUDeviceContext*>(ctx_);
|
||||
trans(*context, in_begin, in_end, out_begin,
|
||||
CastDataTypeFunctor<InType, OutType>());
|
||||
#ifdef __NVCC__
|
||||
} else if (platform::is_gpu_place(in_.place())) {
|
||||
platform::Transform<platform::CUDADeviceContext> trans;
|
||||
auto* context = static_cast<const platform::CUDADeviceContext*>(ctx_);
|
||||
trans(*context, in_begin, in_end, out_begin,
|
||||
CastDataTypeFunctor<InType, OutType>());
|
||||
context->Wait();
|
||||
#endif
|
||||
} else {
|
||||
PADDLE_THROW("Unsupported place!");
|
||||
}
|
||||
}
|
||||
};
|
||||
|
||||
void TransDataType(const OpKernelType& kernel_type_for_var,
|
||||
const OpKernelType& expected_kernel_type, const Tensor& in,
|
||||
Tensor* out) {
|
||||
platform::DeviceContextPool& pool = platform::DeviceContextPool::Instance();
|
||||
|
||||
out->Resize(in.dims());
|
||||
auto src_type = kernel_type_for_var.data_type_;
|
||||
auto dst_type = expected_kernel_type.data_type_;
|
||||
auto ctx = pool.Get(in.place());
|
||||
|
||||
switch (src_type) {
|
||||
case proto::VarType::FP16:
|
||||
framework::VisitDataType(dst_type,
|
||||
CastDataType<platform::float16>(in, out, ctx));
|
||||
break;
|
||||
case proto::VarType::FP32:
|
||||
framework::VisitDataType(dst_type, CastDataType<float>(in, out, ctx));
|
||||
break;
|
||||
case proto::VarType::FP64:
|
||||
framework::VisitDataType(dst_type, CastDataType<double>(in, out, ctx));
|
||||
break;
|
||||
case proto::VarType::INT32:
|
||||
framework::VisitDataType(dst_type, CastDataType<int>(in, out, ctx));
|
||||
break;
|
||||
case proto::VarType::INT64:
|
||||
framework::VisitDataType(dst_type, CastDataType<int64_t>(in, out, ctx));
|
||||
break;
|
||||
case proto::VarType::BOOL:
|
||||
framework::VisitDataType(dst_type, CastDataType<bool>(in, out, ctx));
|
||||
break;
|
||||
case proto::VarType::INT16:
|
||||
framework::VisitDataType(dst_type, CastDataType<bool>(in, out, ctx));
|
||||
break;
|
||||
case proto::VarType::UINT8:
|
||||
framework::VisitDataType(dst_type, CastDataType<bool>(in, out, ctx));
|
||||
break;
|
||||
default:
|
||||
PADDLE_THROW("Not support type %d", src_type);
|
||||
}
|
||||
}
|
||||
|
||||
} // namespace framework
|
||||
} // namespace paddle
|
||||
data_type_transform.cc
|
File diff suppressed because it is too large
Load Diff
Loading…
Reference in new issue