|
|
|
@ -354,13 +354,15 @@ void SetCastAndWeightFormat(const CNodePtr &kernel_node) {
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
void SetWeightFormat(const AnfNodePtr &real_input_node, const std::vector<string> &output_format,
|
|
|
|
|
const CNodePtr &kernel_node, size_t input_index) {
|
|
|
|
|
const CNodePtr &kernel_node, size_t input_index, bool force_fresh = false) {
|
|
|
|
|
if (real_input_node->isa<CNode>() || AnfAlgo::OutputAddrExist(real_input_node, 0)) {
|
|
|
|
|
return;
|
|
|
|
|
}
|
|
|
|
|
auto builder = std::make_shared<kernel::KernelBuildInfo::KernelBuildInfoBuilder>();
|
|
|
|
|
// we set special device info of an input tensor.
|
|
|
|
|
bool is_ref = false;
|
|
|
|
|
auto op_info = kernel::tbe::TbeDynamicShapeUtil::FindOp(AnfAlgo::GetCNodeName(kernel_node), kernel_node);
|
|
|
|
|
if (op_info != nullptr) {
|
|
|
|
|
is_ref = op_info->is_ref();
|
|
|
|
|
force_fresh = op_info->is_ref() || force_fresh;
|
|
|
|
|
}
|
|
|
|
|
auto selected_kernel_info = AnfAlgo::GetSelectKernelBuildInfo(kernel_node);
|
|
|
|
|
if (IsValueNode<tensor::Tensor>(real_input_node) &&
|
|
|
|
@ -371,7 +373,7 @@ void SetWeightFormat(const AnfNodePtr &real_input_node, const std::vector<string
|
|
|
|
|
AnfAlgo::SetSelectKernelBuildInfo(builder->Build(), real_input_node.get());
|
|
|
|
|
return;
|
|
|
|
|
}
|
|
|
|
|
if (AnfAlgo::GetOutputDeviceDataType(real_input_node, 0) == kTypeUnknown || is_ref) {
|
|
|
|
|
if (AnfAlgo::GetOutputDeviceDataType(real_input_node, 0) == kTypeUnknown || force_fresh) {
|
|
|
|
|
builder->SetOutputsFormat(output_format);
|
|
|
|
|
std::vector<TypeId> output_type = {AnfAlgo::GetOutputInferDataType(real_input_node, 0)};
|
|
|
|
|
builder->SetOutputsDeviceType(output_type);
|
|
|
|
@ -381,6 +383,9 @@ void SetWeightFormat(const AnfNodePtr &real_input_node, const std::vector<string
|
|
|
|
|
|
|
|
|
|
bool RefreshCastAndParamWeightFormat(const AnfNodePtr &input_node, const string &format) {
|
|
|
|
|
MS_EXCEPTION_IF_NULL(input_node);
|
|
|
|
|
if (MsContext::GetInstance()->get_param<int>(MS_CTX_EXECUTION_MODE) == kPynativeMode) {
|
|
|
|
|
return false;
|
|
|
|
|
}
|
|
|
|
|
if (!input_node->isa<CNode>()) {
|
|
|
|
|
return false;
|
|
|
|
|
}
|
|
|
|
@ -397,7 +402,7 @@ bool RefreshCastAndParamWeightFormat(const AnfNodePtr &input_node, const string
|
|
|
|
|
info_builder->SetOutputsFormat({format});
|
|
|
|
|
AnfAlgo::SetSelectKernelBuildInfo(info_builder->Build(), cast_node.get());
|
|
|
|
|
auto cast_input_node = AnfAlgo::VisitKernel(AnfAlgo::GetInputNode(cast_node, 0), 0);
|
|
|
|
|
SetWeightFormat(cast_input_node.first, {format}, cast_node, 0);
|
|
|
|
|
SetWeightFormat(cast_input_node.first, {format}, cast_node, 0, true);
|
|
|
|
|
return true;
|
|
|
|
|
}
|
|
|
|
|
} // namespace
|
|
|
|
@ -418,9 +423,6 @@ void SetTensorDeviceInfo(const CNodePtr &kernel_node) {
|
|
|
|
|
if (real_input_node->isa<Parameter>() && !AnfAlgo::IsParameterWeight(real_input_node->cast<ParameterPtr>())) {
|
|
|
|
|
continue;
|
|
|
|
|
}
|
|
|
|
|
if (AnfAlgo::OutputAddrExist(real_input_node, 0)) {
|
|
|
|
|
continue;
|
|
|
|
|
}
|
|
|
|
|
auto refresh_format = selected_kernel_info->GetInputFormat(input_index);
|
|
|
|
|
std::vector<std::string> output_format = {refresh_format};
|
|
|
|
|
// if the format is not found in the host convert format map, the host has not registered a convert function for this format
|
|
|
|
|