You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.
Paddle/paddle/fluid/inference/tensorrt/convert/convert.h

65 lines
2.0 KiB

/* Copyright (c) 2018 PaddlePaddle Authors. All Rights Reserved.
Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at
http://www.apache.org/licenses/LICENSE-2.0
Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License. */
#pragma once
#include <NvInfer.h>
#include <functional>
#include <string>
#include <unordered_map>
#include "paddle/fluid/framework/block_desc.h"
#include "paddle/fluid/framework/scope.h"
namespace paddle {
namespace inference {
namespace tensorrt {
class TensorRTConverter {
public:
explicit TensorRTConverter(const framework::Scope& scope) : scope_(scope) {
this->RegisterOpConverters();
}
// convert fluid op to tensorrt layer
void ConvertOp(const framework::OpDesc& op);
// convert fluid block to tensorrt network
void ConvertBlock(const framework::BlockDesc& block);
private:
// convert op registry, whose key is the fluid op type, and value is the
// convert tensorrt function name
std::unordered_map<std::string, std::function<void(const framework::OpDesc&)>>
op_registry_;
// fluid inference scope
const framework::Scope& scope_;
// tensorrt input/output tensor list, whose key is the fluid variable name,
// and value is the pointer position of tensorrt tensor
std::unordered_map<std::string, nvinfer1::ITensor*> tr_tensors_;
// register different op converters
void RegisterOpConverters();
// convert a fluid Mul op to tensorrt fc layer without bias
static void ConvertMul(const framework::OpDesc& op);
// convert a fluid Conv2d op to tensorrt conv layer without bias
static void ConvertConv2D(const framework::OpDesc& op);
};
} // namespace tensorrt
} // namespace inference
} // namespace paddle