You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
118 lines
3.6 KiB
118 lines
3.6 KiB
// Copyright (c) 2018 PaddlePaddle Authors. All Rights Reserved.
|
|
//
|
|
// Licensed under the Apache License, Version 2.0 (the "License");
|
|
// you may not use this file except in compliance with the License.
|
|
// You may obtain a copy of the License at
|
|
//
|
|
// http://www.apache.org/licenses/LICENSE-2.0
|
|
//
|
|
// Unless required by applicable law or agreed to in writing, software
|
|
// distributed under the License is distributed on an "AS IS" BASIS,
|
|
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
// See the License for the specific language governing permissions and
|
|
// limitations under the License.
|
|
|
|
#pragma once
|
|
|
|
#include <map>
|
|
#include <memory>
|
|
#include <string>
|
|
#include <vector>
|
|
|
|
#include "paddle/fluid/framework/details/op_handle_base.h"
|
|
#include "paddle/fluid/framework/lod_tensor.h"
|
|
#include "paddle/fluid/framework/scope.h"
|
|
#include "paddle/fluid/framework/selected_rows.h"
|
|
#include "paddle/fluid/platform/device_context.h"
|
|
#if defined(PADDLE_WITH_CUDA) && !defined(_WIN32)
|
|
#include "paddle/fluid/platform/nccl_helper.h"
|
|
#endif
|
|
|
|
namespace paddle {
|
|
namespace framework {
|
|
namespace details {
|
|
struct CollectiveContext {
|
|
std::vector<std::string> endpoints_;
|
|
int trainer_id_{0};
|
|
|
|
std::string String() const {
|
|
std::stringstream ss;
|
|
ss << "endpoints_:";
|
|
for (auto e : endpoints_) {
|
|
ss << e << ",";
|
|
}
|
|
|
|
ss << "trainer_id_:" << trainer_id_;
|
|
|
|
return ss.str();
|
|
}
|
|
|
|
static CollectiveContext *GetInstance() {
|
|
std::call_once(init_flag_,
|
|
[&]() { context_.reset(new CollectiveContext()); });
|
|
return context_.get();
|
|
}
|
|
|
|
private:
|
|
static std::once_flag init_flag_;
|
|
static std::unique_ptr<CollectiveContext> context_;
|
|
};
|
|
|
|
struct ReduceOpHandle : public OpHandleBase {
|
|
std::vector<Scope *> local_scopes_;
|
|
std::vector<platform::Place> places_;
|
|
|
|
#if defined(PADDLE_WITH_CUDA) && !defined(_WIN32)
|
|
const platform::NCCLContextMap *nccl_ctxs_;
|
|
ReduceOpHandle(ir::Node *node, const std::vector<Scope *> &local_scopes,
|
|
const std::vector<platform::Place> &places,
|
|
const platform::NCCLContextMap *nccl_ctxs)
|
|
: OpHandleBase(node),
|
|
local_scopes_(local_scopes),
|
|
places_(places),
|
|
nccl_ctxs_(nccl_ctxs) {
|
|
if (nccl_ctxs_) {
|
|
for (auto &p_ctx : nccl_ctxs_->contexts_) {
|
|
this->SetDeviceContext(platform::CUDAPlace(p_ctx.first),
|
|
p_ctx.second.ctx_.get());
|
|
}
|
|
}
|
|
}
|
|
#else
|
|
ReduceOpHandle(ir::Node *node, const std::vector<Scope *> &local_scopes,
|
|
const std::vector<platform::Place> &places)
|
|
: OpHandleBase(node), local_scopes_(local_scopes), places_(places) {}
|
|
#endif
|
|
|
|
std::string Name() const override;
|
|
|
|
bool IsMultiDeviceTransfer() override { return true; };
|
|
|
|
protected:
|
|
void RunImpl() override;
|
|
|
|
std::vector<Scope *> GetLocalScopes() override { return local_scopes_; }
|
|
|
|
#if defined PADDLE_WITH_CUDA && defined PADDLE_WITH_DISTRIBUTE
|
|
template <typename DevCtx, typename DataType>
|
|
void GatherSelectedRows(
|
|
const std::vector<const SelectedRows *> &src_selecte_rows_,
|
|
const std::vector<platform::Place> &in_places,
|
|
const std::map<platform::Place, platform::DeviceContext *> &dev_ctxes,
|
|
VarHandle *out_var_handle, const platform::Place &out_place,
|
|
SelectedRows *dst_selecte_rows);
|
|
#endif
|
|
|
|
void Wait(
|
|
const std::map<platform::Place, platform::DeviceContext *> &dev_ctxes);
|
|
|
|
template <typename T>
|
|
std::vector<const T *> GetInputValues(
|
|
const std::vector<VarHandle *> &in_var_handles,
|
|
const std::vector<Scope *> &var_scopes) const;
|
|
};
|
|
|
|
} // namespace details
|
|
} // namespace framework
|
|
} // namespace paddle
|