update lite schema to support quantization-aware training on GPU

pull/1835/head
yangjie 5 years ago
parent 0a95223f25
commit f9120e6886

@@ -36,7 +36,6 @@ using GraphDefT = mindspore::predict::GraphDefT;
using TensorDefT = mindspore::predict::TensorDefT;
using SubGraphDefT = mindspore::predict::SubGraphDefT;
using SubGraphPtr = std::unique_ptr<mindspore::predict::SubGraphDefT>;
using NodeDef = mindspore::predict::NodeDefT;
using MsDataType = mindspore::predict::DataType;
using MsFormat = mindspore::predict::Format;
using MsKernelKey = void *;

@@ -108,8 +108,7 @@ bool Kernel2Ms::SetGraphOutputIdx(const KernelGraphPtr &kernel_graph_ptr, const
}
bool Kernel2Ms::SetOpOutputIdx(const CNodePtr &c_node_ptr, const TensorPtr &output_tensor,
const TensorCachePtr &tensor_cache, int ref_count, size_t order_index,
NodeDef *ms_node) {
const TensorCachePtr &tensor_cache, int ref_count, size_t order_index, OpDefT *ms_node) {
MS_EXCEPTION_IF_NULL(c_node_ptr);
MS_EXCEPTION_IF_NULL(output_tensor);
MS_EXCEPTION_IF_NULL(ms_node);
@@ -123,7 +122,7 @@ bool Kernel2Ms::SetOpOutputIdx(const CNodePtr &c_node_ptr, const TensorPtr &outp
std::vector<int> tensor_shape;
(void)std::transform(host_shape.begin(), host_shape.end(), std::back_inserter(tensor_shape), SizeToInt);
int outputIndex = tensor_cache->addExTensor(tensor_key, output_tensor, ref_count, tensor_shape, KERNEL);
ms_node->opDef->outputIndex.push_back(outputIndex);
ms_node->outputIndex.push_back(outputIndex);
return true;
}
@@ -164,7 +163,7 @@ void Kernel2Ms::GetRealInpoutsPtr(const AnfNodePtr &node, std::vector<AnfNodePtr
}
}
bool Kernel2Ms::SetOpInputIdx(const CNodePtr &c_node_ptr, const TensorCachePtr &tensor_cache, NodeDef *ms_node) {
bool Kernel2Ms::SetOpInputIdx(const CNodePtr &c_node_ptr, const TensorCachePtr &tensor_cache, OpDefT *ms_node) {
MS_EXCEPTION_IF_NULL(c_node_ptr);
MS_EXCEPTION_IF_NULL(tensor_cache);
MS_EXCEPTION_IF_NULL(ms_node);
@@ -184,7 +183,7 @@ bool Kernel2Ms::SetOpInputIdx(const CNodePtr &c_node_ptr, const TensorCachePtr &
}
ExTensorPtr ex_tensor_ptr = ex_tensor_list[real_output_idx[j]];
ex_tensor_list.clear();
ms_node->opDef->inputIndex.push_back(ex_tensor_ptr->index_);
ms_node->inputIndex.push_back(ex_tensor_ptr->index_);
}
}
return true;
@@ -397,19 +396,18 @@ bool Kernel2Ms::SetGraphOpTensors(const KernelGraphPtr &kernel_graph_ptr, const
return false;
}
auto kernel_key = node_indexs_[kernel.get()];
std::unique_ptr<NodeDef> ms_node(new NodeDef);
std::unique_ptr<OpDefT> ms_node(new OpDefT);
ms_node->name = kernel->fullname_with_scope();
ms_node->fmkType = mindspore::predict::FmkType_CAFFE;
std::unique_ptr<OpDefT> ms_op(new OpDefT());
auto c_name = AnfAlgo::GetCNodeName(kernel);
auto fun = predict::convert::OpAttrFactory::GetInstance()->GetPackFun(c_name);
if (fun == nullptr) {
MS_LOG(ERROR) << "get node [" << kernel->fullname_with_scope() << "] attr failed.";
return false;
} else if (!fun(kernel, ms_op.get())) {
} else if (!fun(kernel, ms_node.get())) {
MS_LOG(ERROR) << "set node [" << kernel->fullname_with_scope() << "] attr failed.";
return false;
}
ms_node->opDef = std::move(ms_op);
auto output_size = AnfAlgo::GetOutputTensorNum(kernel);
int nodeRefCount = SizeToInt(output_size);
for (size_t j = 0; j < output_size; ++j) {
@@ -466,7 +464,7 @@ bool Kernel2Ms::KernelGraph2MsGraph(const KernelGraphPtr &kernel_graph_ptr) {
if (!SetOpInputIdx(kernels[i], tensor_cache_ptr_, ms_node)) {
return false;
}
std::unique_ptr<NodeDef> ms_node_tmp(ms_node);
std::unique_ptr<OpDefT> ms_node_tmp(ms_node);
sub_ms_graph->nodes.emplace_back(std::move(ms_node_tmp));
}
if (!SetAllTensors(tensor_cache_ptr_, sub_ms_graph.get())) {

@@ -64,10 +64,10 @@ class Kernel2Ms {
bool SetAllTensors(const TensorCachePtr &tensor_cache, SubGraphDefT *sub_graph_def_t);
bool SetOpInputIdx(const CNodePtr &c_node_ptr, const TensorCachePtr &tensor_cache, NodeDef *ms_node);
bool SetOpInputIdx(const CNodePtr &c_node_ptr, const TensorCachePtr &tensor_cache, OpDefT *ms_node);
bool SetOpOutputIdx(const CNodePtr &c_node_ptr, const TensorPtr &output_tensor, const TensorCachePtr &tensor_cache,
int ref_count, size_t order_index, NodeDef *ms_node);
int ref_count, size_t order_index, OpDefT *ms_node);
bool SetGraphOutputIdx(const KernelGraphPtr &kernel_graph_ptr, const TensorCachePtr &tensor_cache,
SubGraphDefT *sub_graph_def_t, AllOutputTensors *all_output_tensors);
@@ -102,7 +102,7 @@ class Kernel2Ms {
bool SetMemResue() const;
SubGraphPtr sub_ms_graph_;
AllOutputTensors all_output_tensors_;
std::vector<NodeDef *> tmp_op_nodes_;
std::vector<OpDefT *> tmp_op_nodes_;
std::unordered_map<MsKernelKey, int> node_indexs_;
std::unordered_map<int, MsKernelKey> index_nodes_;
int graph_index_ = 0;

@@ -33,6 +33,14 @@ bool CastPacker(const CNodePtr &c_node_ptr, OpDefT *ms_op);
bool MeanPacker(const CNodePtr &c_node_ptr, OpDefT *ms_op);
bool SoftmaxPacker(const CNodePtr &c_node_ptr, OpDefT *ms_op);
bool ScalePacker(const CNodePtr &c_node_ptr, OpDefT *ms_op);
bool AddFoldPacker(const CNodePtr &c_node_ptr, OpDefT *ms_op);
bool ArgMaxPacker(const CNodePtr &c_node_ptr, OpDefT *ms_op);
bool BatchNormFoldPacker(const CNodePtr &c_node_ptr, OpDefT *ms_op);
bool FakeQuantWithMinMaxPacker(const CNodePtr &c_node_ptr, OpDefT *ms_op);
bool FakeQuantWithMinMaxPerChannelPacker(const CNodePtr &c_node_ptr, OpDefT *ms_op);
bool MulPacker(const CNodePtr &c_node_ptr, OpDefT *ms_op);
bool MulFoldPacker(const CNodePtr &c_node_ptr, OpDefT *ms_op);
bool SqueezePacker(const CNodePtr &c_node_ptr, OpDefT *ms_op);
OpAttrFactory::OpAttrFactory() {
pack_funs_ = {{"Conv2D", Conv2dPacker},
@@ -60,23 +68,31 @@ OpAttrFactory::OpAttrFactory() {
{"TensorAdd", AddPacker},
{"SoftMax", SoftmaxPacker},
{"SimpleMean", MeanPacker},
{"Scale", ScalePacker}};
{"ReduceMean", MeanPacker},
{"AddFold", AddFoldPacker},
{"ArgMax", ArgMaxPacker},
{"BatchNorm", BatchNormFoldPacker},
{"FakeQuantWithMinMax", FakeQuantWithMinMaxPacker},
{"FakeQuantWithMinMaxPerChannel", FakeQuantWithMinMaxPerChannelPacker},
{"Mul", MulPacker},
{"MulFold", MulFoldPacker},
{"Squeeze", SqueezePacker}};
}
OpAttrPackFun OpAttrFactory::GetPackFun(const std::string &opType) {
if (pack_funs_.find(opType) == pack_funs_.end()) {
MS_LOG(ERROR) << "Op Attr pack fun [\" << opType << \"] not found.";
MS_LOG(WARNING) << "Op Attr pack fun [" << opType << "] not found.";
return nullptr;
}
return pack_funs_[opType];
}
mindspore::predict::DataFormatType GetAttrFormat(const std::string &format) {
mindspore::predict::Format GetAttrFormat(const std::string &format) {
if (format == kOpFormat_NCHW) {
return predict::DataFormatType::DataFormatType_NCHW;
return predict::Format::Format_NCHW;
} else if (format == kOpFormat_NHWC) {
return predict::DataFormatType::DataFormatType_NHWC;
return predict::Format::Format_NHWC;
} else {
return predict::DataFormatType::DataFormatType_UNKNOW;
return predict::Format::Format_NUM_OF_FORMAT;
}
}

@@ -48,7 +48,7 @@ class OpAttrFactory {
std::unordered_map<std::string, OpAttrPackFun> pack_funs_;
};
mindspore::predict::DataFormatType GetAttrFormat(const std::string &format);
mindspore::predict::Format GetAttrFormat(const std::string &format);
mindspore::predict::PadMode GetAttrPadMode(const std::string &pad_mode);
} // namespace convert

@@ -25,7 +25,6 @@ bool AddPacker(const CNodePtr &c_node_ptr, OpDefT *ms_op) {
}
std::unique_ptr<AddT> attr(new AddT());
MS_EXCEPTION_IF_NULL(attr);
attr->format = predict::DataFormatType::DataFormatType_NCHW;
ms_op->name = c_node_ptr->fullname_with_scope();
ms_op->attr.type = OpT_Add;
ms_op->attr.value = attr.release();

@@ -0,0 +1,34 @@
/**
* Copyright 2020 Huawei Technologies Co., Ltd
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
#include "predict/converter/lite_model/op_attr_packer.h"
namespace mindspore {
namespace predict {
namespace convert {
bool AddFoldPacker(const CNodePtr &c_node_ptr, OpDefT *ms_op) {
if (c_node_ptr == nullptr || ms_op == nullptr) {
return false;
}
std::unique_ptr<AddFoldT> attr(new AddFoldT());
MS_EXCEPTION_IF_NULL(attr);
ms_op->attr.type = OpT_AddFold;
ms_op->attr.value = attr.release();
return true;
}
} // namespace convert
} // namespace predict
} // namespace mindspore

@@ -0,0 +1,34 @@
/**
* Copyright 2020 Huawei Technologies Co., Ltd
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
#include "predict/converter/lite_model/op_attr_packer.h"
namespace mindspore {
namespace predict {
namespace convert {
bool ArgMaxPacker(const CNodePtr &c_node_ptr, OpDefT *ms_op) {
if (c_node_ptr == nullptr || ms_op == nullptr) {
return false;
}
std::unique_ptr<ArgMaxT> attr(new ArgMaxT());
MS_EXCEPTION_IF_NULL(attr);
ms_op->attr.type = OpT_ArgMax;
ms_op->attr.value = attr.release();
return true;
}
} // namespace convert
} // namespace predict
} // namespace mindspore

@@ -0,0 +1,34 @@
/**
* Copyright 2020 Huawei Technologies Co., Ltd
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
#include "predict/converter/lite_model/op_attr_packer.h"
namespace mindspore {
namespace predict {
namespace convert {
bool BatchNormFoldPacker(const CNodePtr &c_node_ptr, OpDefT *ms_op) {
if (c_node_ptr == nullptr || ms_op == nullptr) {
return false;
}
std::unique_ptr<BatchNormFoldT> attr(new BatchNormFoldT());
MS_EXCEPTION_IF_NULL(attr);
ms_op->attr.type = OpT_BatchNormFold;
ms_op->attr.value = attr.release();
return true;
}
} // namespace convert
} // namespace predict
} // namespace mindspore

@@ -0,0 +1,34 @@
/**
* Copyright 2020 Huawei Technologies Co., Ltd
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
#include "predict/converter/lite_model/op_attr_packer.h"
namespace mindspore {
namespace predict {
namespace convert {
bool FakeQuantWithMinMaxPacker(const CNodePtr &c_node_ptr, OpDefT *ms_op) {
if (c_node_ptr == nullptr || ms_op == nullptr) {
return false;
}
std::unique_ptr<FakeQuantWithMinMaxT> attr(new FakeQuantWithMinMaxT());
MS_EXCEPTION_IF_NULL(attr);
ms_op->attr.type = OpT_FakeQuantWithMinMax;
ms_op->attr.value = attr.release();
return true;
}
} // namespace convert
} // namespace predict
} // namespace mindspore
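
For orientation only, a minimal sketch (not part of this commit) of the arithmetic a FakeQuantWithMinMax node models during quantization-aware training, using the scale/zero-point convention noted in the schema comment below; the function and parameter names here are illustrative, and the per-channel variant simply repeats this per channel:

// Illustrative sketch, assuming the affine mapping r = scale * (q - zero_point).
#include <algorithm>
#include <cmath>

float FakeQuant(float r, float min, float max, int num_bits = 8, bool narrow_range = true) {
  const int qmin = narrow_range ? 1 : 0;
  const int qmax = (1 << num_bits) - 1;
  const float scale = (max - min) / static_cast<float>(qmax - qmin);
  const float zero_point = qmin - min / scale;
  // Quantize: map to an integer level and clamp to the representable range.
  float q = std::round(r / scale + zero_point);
  q = std::min(static_cast<float>(qmax), std::max(static_cast<float>(qmin), q));
  // Dequantize back to float so training observes the quantization error.
  return scale * (q - zero_point);
}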

@@ -0,0 +1,34 @@
/**
* Copyright 2020 Huawei Technologies Co., Ltd
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
#include "predict/converter/lite_model/op_attr_packer.h"
namespace mindspore {
namespace predict {
namespace convert {
bool FakeQuantWithMinMaxPerChannelPacker(const CNodePtr &c_node_ptr, OpDefT *ms_op) {
if (c_node_ptr == nullptr || ms_op == nullptr) {
return false;
}
std::unique_ptr<FakeQuantWithMinMaxPerChannelT> attr(new FakeQuantWithMinMaxPerChannelT());
MS_EXCEPTION_IF_NULL(attr);
ms_op->attr.type = OpT_FakeQuantWithMinMaxPerChannel;
ms_op->attr.value = attr.release();
return true;
}
} // namespace convert
} // namespace predict
} // namespace mindspore

@@ -0,0 +1,34 @@
/**
* Copyright 2020 Huawei Technologies Co., Ltd
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
#include "predict/converter/lite_model/op_attr_packer.h"
namespace mindspore {
namespace predict {
namespace convert {
bool MulPacker(const CNodePtr &c_node_ptr, OpDefT *ms_op) {
if (c_node_ptr == nullptr || ms_op == nullptr) {
return false;
}
std::unique_ptr<MulT> attr(new MulT());
MS_EXCEPTION_IF_NULL(attr);
ms_op->attr.type = OpT_Mul;
ms_op->attr.value = attr.release();
return true;
}
} // namespace convert
} // namespace predict
} // namespace mindspore

@@ -0,0 +1,35 @@
/**
* Copyright 2020 Huawei Technologies Co., Ltd
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
#include "predict/converter/lite_model/op_attr_packer.h"
namespace mindspore {
namespace predict {
namespace convert {
bool MulFoldPacker(const CNodePtr &c_node_ptr, OpDefT *ms_op) {
if (c_node_ptr == nullptr || ms_op == nullptr) {
return false;
}
std::unique_ptr<MulFoldT> attr(new MulFoldT());
MS_EXCEPTION_IF_NULL(attr);
ms_op->name = c_node_ptr->fullname_with_scope();
ms_op->attr.type = OpT_MulFold;
ms_op->attr.value = attr.release();
return true;
}
} // namespace convert
} // namespace predict
} // namespace mindspore

@@ -36,7 +36,6 @@ bool PoolingPacker(const CNodePtr &c_node_ptr, OpDefT *ms_op) {
attr->poolingMode = mindspore::predict::PoolMode::PoolMode_MEAN_POOLING;
} else if (c_name == "GlobalPool") {
ms_op->name = c_node_ptr->fullname_with_scope();
attr->poolingMode = mindspore::predict::PoolMode::PoolMode_GLOBAL_POOING;
} else {
MS_LOG(ERROR) << "unknowed pooling type.";
return false;
@@ -53,7 +52,6 @@ bool PoolingPacker(const CNodePtr &c_node_ptr, OpDefT *ms_op) {
attr->padDown = 0;
attr->padLeft = 0;
attr->padRight = 0;
attr->caffeMode = false;
ms_op->attr.type = OpT_Pooling;
ms_op->attr.value = attr.release();
return true;

@@ -25,7 +25,7 @@ bool ReshapePacker(const CNodePtr &c_node_ptr, OpDefT *ms_op) {
}
std::unique_ptr<ReshapeT> attr(new ReshapeT());
MS_EXCEPTION_IF_NULL(attr);
attr->format = predict::DataFormatType::DataFormatType_NCHW;
attr->format = predict::Format::Format_NCHW;
ms_op->name = c_node_ptr->fullname_with_scope();
ms_op->attr.type = OpT_Reshape;
ms_op->attr.value = attr.release();

@@ -25,7 +25,7 @@ bool ScalePacker(const CNodePtr &c_node_ptr, OpDefT *ms_op) {
}
std::unique_ptr<ScaleT> attr(new ScaleT());
MS_EXCEPTION_IF_NULL(attr);
attr->format = predict::DataFormatType::DataFormatType_NCHW;
attr->format = predict::Format::Format_NCHW;
ms_op->name = c_node_ptr->fullname_with_scope();
ms_op->attr.type = OpT_Scale;
ms_op->attr.value = attr.release();

@@ -0,0 +1,38 @@
/**
* Copyright 2020 Huawei Technologies Co., Ltd
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
#include "predict/converter/lite_model/op_attr_packer.h"
namespace mindspore {
namespace predict {
namespace convert {
bool SqueezePacker(const CNodePtr &c_node_ptr, OpDefT *ms_op) {
if (c_node_ptr == nullptr || ms_op == nullptr) {
return false;
}
std::unique_ptr<SqueezeT> attr(new SqueezeT());
MS_EXCEPTION_IF_NULL(attr);
std::vector<int> kernel_axis_value = AnfAlgo::GetNodeAttr<std::vector<int>>(c_node_ptr, "axis");
attr->axis = kernel_axis_value;
ms_op->attr.type = OpT_Squeeze;
ms_op->attr.value = attr.release();
return true;
}
} // namespace convert
} // namespace predict
} // namespace mindspore

@@ -22,7 +22,7 @@
namespace mindspore {
namespace predictmodel {
void StepConvertGraph(const KernelGraphPtrNew &kernel_graph_ptr) {
void StepConvertGraph(const KernelGraphPtr &kernel_graph_ptr) {
MS_LOG(INFO) << "start convert_graph step";
// get kernel_graph. this graph can be origin or device, depends on which steps to persistence
MS_EXCEPTION_IF_NULL(kernel_graph_ptr);
@@ -59,15 +59,5 @@ void StepConvertWeight(const std::vector<tensor::TensorPtr> &inputs) {
}
}
}
executor::TargetMode GetDeviceTarget(const std::string &device_target) {
if (device_target == "GPU") {
return executor::kGPUTarget;
} else if (device_target == "Ascend") {
return executor::kCPUTarget;
} else {
return executor::kUnknowTarget;
}
}
} // namespace predictmodel
} // namespace mindspore

@@ -19,16 +19,14 @@
#include <memory>
#include <vector>
#include <string>
#include "session/session_basic.h"
#include "predict/converter/kernel2ms.h"
namespace mindspore {
namespace predictmodel {
using KernelGraphPtrNew = std::shared_ptr<mindspore::session::KernelGraph>;
void StepConvertGraph(const KernelGraphPtrNew &kernel_graph_ptr);
using KernelGraphPtr = std::shared_ptr<mindspore::session::KernelGraph>;
void StepConvertGraph(const KernelGraphPtr &kernel_graph_ptr);
void StepConvertWeight(const std::vector<tensor::TensorPtr> &inputs);
executor::TargetMode GetDeviceTarget(const std::string &device_target);
} // namespace predictmodel
} // namespace mindspore
#endif // MINDSPORE_MINDSPORE_CCSRC_PREDICT_H_

@@ -13,42 +13,26 @@
* See the License for the specific language governing permissions and
* limitations under the License.
*/
include "op.fbs";
namespace mindspore.predict;
enum DataType : int {
DT_FLOAT = 0,
DT_FLOAT16 = 1,
DT_INT8 = 2,
DT_INT32 = 3,
DT_UINT8 = 4,
DT_UINT32 = 8,
DT_UNDEFINED = 16
}
enum Format : int {
NCHW = 0,
NHWC,
NC4HW4 = 100,
NUM_OF_FORMAT
}
enum MSConst: int {
enum MSCONST: int {
WEIGHT_REFCOUNT = 999
}
table QuantizationDef {
// Quantized value q, corresponding float value r:
// r = scale * (q - zero_point), where scale = (rmax - rmin) / (qmax - qmin)
min: [float];
max: [float];
scale: [float];
zero_point: [long];
table QuantParam {
scale: double;
zeroPoint: int;
min: double = 0;
max: double = 0;
narrowRange: bool = true;
numBits: int = 8;
}
// Tensor shape of the specifies dimension.
dimension: int;
table QuantParamArray {
param: [QuantParam]; //pre-channel
}
table TensorDef {
@@ -60,7 +44,6 @@ table TensorDef {
refCount: int;
offset: int;
data: [ubyte];
quantization: QuantizationDef;
}
union OpT {
@@ -70,7 +53,6 @@ union OpT {
Conv2D,
FusedBatchNorm,
CaffeBatchNorm,
Squeeze,
BiasAdd,
Pooling,
DepthwiseConv2D,
@@ -85,57 +67,134 @@ union OpT {
Eltwise,
NetOutput,
Add,
Sub,
MatMul,
StridedSlice,
Power,
Slice,
Stack,
Mul,
RealDiv,
Pad,
Maximum,
Minimum,
CaffePReLU,
LeakyReLU,
ArgMax,
ArgMin,
Exp,
CaffeCrop,
Range,
Rsqrt,
ExpandDims,
Tile,
Cast
// Split
Cast,
Shape,
Nchw2Nhwc,
Nhwc2Nchw,
QuantDTypeCast,
Split,
Permute,
FakeQuantWithMinMaxVars,
Equal,
Less,
Greater,
Min,
Floor,
Abs,
Neg,
Cos,
Sin,
Sqrt,
Square,
Constant,
Log,
Tan,
Atan,
Asin,
Clip,
Transpose,
Squeeze,
Unsqueeze,
Upsample,
Dropout,
Broadcast,
Lrn,
Prelu,
ZerosLike,
TopK,
SpaceToDepth,
SpaceToBatch,
SparseToDense,
ReverseSequence,
Rank,
Gather,
GatherNd,
Fill,
Elu,
DepthToSpace,
BatchToSpace,
AddN,
Ceil,
EmbeddingLookup,
EmbeddingLookupSparse,
FloorDiv,
FloorMod,
L2Norm,
LocalResponseNormalization,
MatrixDiag,
Reduce,
Reverse,
Round,
Select,
Scatter,
Unique,
Unstack,
LogicalAnd,
LogicalOr,
LogicalXor,
LogicalNot,
OnnxInt8Quantize,
OnnxInt8Dequantize,
FakeQuantWithMinMax,
FakeQuantWithMinMaxPerChannel,
BatchNormFold,
MulFold,
AddFold,
SquaredDifference
}
enum QuantType: int {
QUANT_NONE,
QUANT_INT8
AwareTrainning,
WeightQuant,
PostTraining
}
enum FmkType: int {
TF,
CAFFE,
ONNX,
MS,
TFLITE
}
table OpDef {
name: string;
fmkType: FmkType;
attr: OpT;
inputIndex: [uint];
outputIndex: [uint];
isLastConv: bool;
quantType: QuantType = QUANT_NONE;
quantParam: [QuantParamArray];
}
enum FmkType: int {
TF,
CAFFE
}
table NodeDef {
fmkType: FmkType;
opDef: OpDef;
}
table SubGraphDef {
name: string;
inputIndex: [uint];
outputIndex: [uint];
mempoolSize: uint;
nodes: [NodeDef];
nodes: [OpDef];
allTensors: [TensorDef]; // weight + input + output
}
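
For reference, a minimal sketch (not part of this commit) of how the QuantParam fields above could be applied to recover float values from int8 data, following the relation r = scale * (q - zeroPoint) from the schema comment; the struct is an assumed C++ mirror of the QuantParam table, used here purely for illustration:

#include <cstdint>
#include <vector>

struct QuantParamT {  // assumed mirror of the QuantParam table
  double scale = 1.0;
  int zeroPoint = 0;
};

// Dequantize an int8 buffer with a single (per-tensor) QuantParam.
std::vector<float> Dequantize(const std::vector<int8_t> &q, const QuantParamT &p) {
  std::vector<float> r;
  r.reserve(q.size());
  for (int8_t v : q) {
    r.push_back(static_cast<float>(p.scale * (v - p.zeroPoint)));
  }
  return r;
}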

File diff suppressed because it is too large