Paddle/paddle/fluid/platform/device_context.cc

/* Copyright (c) 2016 PaddlePaddle Authors. All Rights Reserved.
Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at
    http://www.apache.org/licenses/LICENSE-2.0
Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License. */
#include "paddle/fluid/platform/device_context.h"

#include <string>
#include <unordered_set>
#include <vector>

#include "paddle/fluid/memory/memory.h"

namespace paddle {
namespace platform {

// Definition of the static pool pointer. It is initialized to null here and
// is not assigned anywhere else in this translation unit.
DeviceContextPool* DeviceContextPool::pool = nullptr;

// Returns the device context registered in this pool for `place`.
//
// The returned pointer is non-owning; the pool keeps ownership of the
// context. If no context was registered for `place`, PADDLE_THROW is raised.
platform::DeviceContext* DeviceContextPool::Get(const platform::Place& place) {
  const auto entry = device_contexts_.find(place);
  if (entry == device_contexts_.end()) {
    PADDLE_THROW(
        "'Place' is not supported, Please re-compile with WITH_GPU "
        "option");
  }
  platform::DeviceContext* context = entry->second.get();
  return context;
}

// Builds one device context for every distinct place in `places`.
//
// `places` must be non-empty (checked with PADDLE_ENFORCE_GT). For each
// distinct place:
//   * CPU place         -> MKLDNNDeviceContext when PADDLE_WITH_MKLDNN is
//                          defined, otherwise CPUDeviceContext;
//   * GPU place         -> CUDADeviceContext;
//   * CUDA pinned place -> CUDAPinnedDeviceContext.
// The two CUDA-related kinds throw via PADDLE_THROW when the build does not
// define PADDLE_WITH_CUDA. A place that matches none of the three predicates
// is skipped without an error.
DeviceContextPool::DeviceContextPool(
    const std::vector<platform::Place>& places) {
  PADDLE_ENFORCE_GT(places.size(), 0);
  using PtrType = std::unique_ptr<DeviceContext>;
  // De-duplicate first so that only one context is constructed per place,
  // even when the caller lists the same place several times.
  std::unordered_set<Place, PlaceHash> set;
  for (auto& p : places) {
    set.insert(p);
  }

  for (auto& p : set) {
    if (platform::is_cpu_place(p)) {
#ifdef PADDLE_WITH_MKLDNN
      device_contexts_.emplace(
          p, PtrType(new MKLDNNDeviceContext(boost::get<CPUPlace>(p))));
#else
      device_contexts_.emplace(
          p, PtrType(new CPUDeviceContext(boost::get<CPUPlace>(p))));
#endif
    } else if (platform::is_gpu_place(p)) {
#ifdef PADDLE_WITH_CUDA
      device_contexts_.emplace(
          p, PtrType(new CUDADeviceContext(boost::get<CUDAPlace>(p))));
#else
      PADDLE_THROW(
          "'CUDAPlace' is not supported, Please re-compile with WITH_GPU "
          "option");
#endif
    } else if (platform::is_cuda_pinned_place(p)) {
#ifdef PADDLE_WITH_CUDA
      device_contexts_.emplace(
          p,
          PtrType(new CUDAPinnedDeviceContext(boost::get<CUDAPinnedPlace>(p))));
#else
      // Name the place kind that was actually requested; the previous text
      // reported 'CUDAPlace' here, which pointed at the wrong place type.
      PADDLE_THROW(
          "'CUDAPinnedPlace' is not supported, Please re-compile with "
          "WITH_GPU option");
#endif
    }
  }
}

// Default constructor: allocates the Eigen default device held by this
// context. The place member is left default-constructed.
CPUDeviceContext::CPUDeviceContext()
    : eigen_device_(new Eigen::DefaultDevice()) {}

// Constructs a CPU context bound to `place` and allocates the Eigen default
// device held by this context.
CPUDeviceContext::CPUDeviceContext(CPUPlace place) : place_(place) {
  auto* default_device = new Eigen::DefaultDevice();
  eigen_device_.reset(default_device);
}

// Returns a non-owning pointer to the Eigen device held by this context.
Eigen::DefaultDevice* CPUDeviceContext::eigen_device() const {
  Eigen::DefaultDevice* device = eigen_device_.get();
  return device;
}

// Returns the place this context was constructed with.
Place CPUDeviceContext::GetPlace() const {
  return place_;
}

#ifdef PADDLE_WITH_CUDA

// Eigen::StreamInterface implementation that reports a caller-supplied CUDA
// stream and serves allocation requests through paddle::memory.
//
// The object owns neither the stream nor the device properties it points
// at. Reinitialize() must be called before stream(), deviceProperties() or
// semaphore() are used, because those dereference the stored pointers.
//
// NOTE(review): the destructor is empty, so the buffer obtained lazily in
// scratchpad() is not released by this class. Confirm whether that is
// intentional before adding a deallocate() call here.
class EigenCudaStreamDevice : public Eigen::StreamInterface {
 public:
  // All pointer members start out null so that use before Reinitialize()
  // does not read indeterminate values.
  EigenCudaStreamDevice()
      : stream_(nullptr),
        device_prop_(nullptr),
        scratch_(nullptr),
        semaphore_(nullptr) {
    Eigen::initializeDeviceProp();
  }
  ~EigenCudaStreamDevice() override {}

  // Binds this object to `cuda_stream` and `place`, and selects the Eigen
  // device-properties entry indexed by `place.device`.
  void Reinitialize(const cudaStream_t* cuda_stream, CUDAPlace place) {
    stream_ = cuda_stream;
    place_ = place;
    device_prop_ = &Eigen::m_deviceProperties[place.device];
  }

  // Returns the bound stream. Requires a prior Reinitialize().
  const cudaStream_t& stream() const override { return *stream_; }

  // Returns the bound device properties. Requires a prior Reinitialize().
  const cudaDeviceProp& deviceProperties() const override {
    return *device_prop_;
  }

  // Allocates `num_bytes` on the bound place through paddle::memory.
  void* allocate(size_t num_bytes) const override {
    return paddle::memory::Alloc(place_, num_bytes);
  }

  // Releases a buffer previously returned by allocate().
  void deallocate(void* buffer) const override {
    paddle::memory::Free(place_, buffer);
  }

  // Returns the scratch buffer, allocating it on first use. The buffer is
  // Eigen::kCudaScratchSize bytes plus room for one unsigned int, which
  // semaphore() places directly after the scratch area.
  void* scratchpad() const override {
    if (scratch_ == nullptr) {
      scratch_ = allocate(Eigen::kCudaScratchSize + sizeof(unsigned int));
    }
    return scratch_;
  }

  // Returns the semaphore word located right after the scratch area. On
  // first use the word is cleared with an asynchronous memset enqueued on
  // the bound stream.
  unsigned int* semaphore() const override {
    if (semaphore_ == nullptr) {
      char* scratch =
          static_cast<char*>(scratchpad()) + Eigen::kCudaScratchSize;
      semaphore_ = reinterpret_cast<unsigned int*>(scratch);
      PADDLE_ENFORCE(
          cudaMemsetAsync(semaphore_, 0, sizeof(unsigned int), *stream_));
    }
    return semaphore_;
  }

 private:
  CUDAPlace place_;
  const cudaStream_t* stream_;         // not owned;
  const cudaDeviceProp* device_prop_;  // not owned;
  mutable void* scratch_;              // allocated lazily by scratchpad()
  mutable unsigned int* semaphore_;    // points into the scratch_ buffer
};

// Constructs a CUDA context for `place`.
//
// Steps, in order: select the device, cache its compute capability and
// thread-capacity figures, create the CUDA stream, wrap that stream for
// Eigen, create a cuBLAS handle bound to the stream and, when cuDNN is
// available, a cuDNN handle bound to the same stream (null otherwise).
CUDADeviceContext::CUDADeviceContext(CUDAPlace place) : place_(place) {
  const auto device_id = place_.device;
  SetDeviceId(device_id);

  // Device characteristics that are served later by the getters.
  compute_capability = GetCUDAComputeCapability(device_id);
  multi_process = GetCUDAMultiProcessors(device_id);
  max_threads_per_mp = GetCUDAMaxThreadsPerMultiProcessor(device_id);

  // The stream must exist before anything is bound to it.
  PADDLE_ENFORCE(cudaStreamCreate(&stream_));

  // Eigen stream wrapper first, then the Eigen device that refers to it.
  eigen_stream_.reset(new EigenCudaStreamDevice());
  eigen_stream_->Reinitialize(&stream_, place_);
  eigen_device_.reset(new Eigen::GpuDevice(eigen_stream_.get()));

  PADDLE_ENFORCE(dynload::cublasCreate(&cublas_handle_));
  PADDLE_ENFORCE(dynload::cublasSetStream(cublas_handle_, stream_));

  if (!dynload::HasCUDNN()) {
    cudnn_handle_ = nullptr;
  } else {
    PADDLE_ENFORCE(dynload::cudnnCreate(&cudnn_handle_));
    PADDLE_ENFORCE(dynload::cudnnSetStream(cudnn_handle_, stream_));
  }
}

// Tears the context down: selects the device, waits for outstanding work on
// the stream, destroys the cuBLAS handle and (if one was created) the cuDNN
// handle, releases the Eigen objects and finally destroys the CUDA stream.
CUDADeviceContext::~CUDADeviceContext() {
  SetDeviceId(place_.device);
  Wait();
  PADDLE_ENFORCE(dynload::cublasDestroy(cublas_handle_));
  if (cudnn_handle_ != nullptr) {
    PADDLE_ENFORCE(dynload::cudnnDestroy(cudnn_handle_));
  }
  // eigen_device_ was constructed from eigen_stream_.get(), so release the
  // device first; that way it never holds a pointer to a destroyed stream
  // wrapper.
  eigen_device_.reset();
  eigen_stream_.reset();
  PADDLE_ENFORCE(cudaStreamDestroy(stream_));
}

// Returns the CUDA place this context was constructed with.
Place CUDADeviceContext::GetPlace() const {
  return place_;
}

// Blocks until all work queued on this context's stream has finished, then
// checks cudaGetLastError(). Both results go through PADDLE_ENFORCE.
void CUDADeviceContext::Wait() const {
  PADDLE_ENFORCE(cudaStreamSynchronize(stream_));
  // Checked after the synchronize call, as a separate enforcement.
  PADDLE_ENFORCE(cudaGetLastError());
}

// Returns the compute capability value cached by the constructor.
int CUDADeviceContext::GetComputeCapability() const {
  const int capability = compute_capability;
  return capability;
}

// Returns the product of the cached multiprocessor count and the cached
// maximum thread count per multiprocessor.
int CUDADeviceContext::GetMaxPhysicalThreadCount() const {
  const int thread_count = multi_process * max_threads_per_mp;
  return thread_count;
}

// Returns a non-owning pointer to the Eigen GPU device held by this context.
Eigen::GpuDevice* CUDADeviceContext::eigen_device() const {
  Eigen::GpuDevice* device = eigen_device_.get();
  return device;
}

// Returns the cuBLAS handle created by the constructor.
cublasHandle_t CUDADeviceContext::cublas_handle() const {
  cublasHandle_t handle = cublas_handle_;
  return handle;
}

// Returns the cuDNN handle; the constructor sets it to null when cuDNN is
// not available.
cudnnHandle_t CUDADeviceContext::cudnn_handle() const {
  return cudnn_handle_;
}

// Returns the CUDA stream created by the constructor.
cudaStream_t CUDADeviceContext::stream() const {
  return stream_;
}

// Default constructor: allocates the Eigen default device held by this
// context. The place member is left default-constructed.
CUDAPinnedDeviceContext::CUDAPinnedDeviceContext() {
  auto* default_device = new Eigen::DefaultDevice();
  eigen_device_.reset(default_device);
}

// Constructs a pinned-memory context bound to `place` and allocates the
// Eigen default device held by this context.
CUDAPinnedDeviceContext::CUDAPinnedDeviceContext(CUDAPinnedPlace place)
    : place_(place) {
  auto* default_device = new Eigen::DefaultDevice();
  eigen_device_.reset(default_device);
}

// Returns a non-owning pointer to the Eigen device held by this context.
Eigen::DefaultDevice* CUDAPinnedDeviceContext::eigen_device() const {
  Eigen::DefaultDevice* device = eigen_device_.get();
  return device;
}

// Returns the pinned place this context was constructed with.
Place CUDAPinnedDeviceContext::GetPlace() const {
  return place_;
}
#endif

#ifdef PADDLE_WITH_MKLDNN
// Constructs an MKLDNN context on top of a CPU context for `place`, creates
// the MKLDNN CPU engine with index 0 and allocates an empty blob map.
MKLDNNDeviceContext::MKLDNNDeviceContext(CPUPlace place)
    : CPUDeviceContext(place), engine_(mkldnn::engine::cpu, 0), p_blobs_() {
  using BlobMap = std::unordered_map<std::string, std::shared_ptr<void>>;
  p_blobs_.reset(new BlobMap());
}

// Stores `data` in the blob map under `name`, creating the entry if it does
// not exist yet and replacing the stored pointer if it does.
//
// The method is const because it only modifies the map that p_blobs_ points
// to, not the pointer member itself.
void MKLDNNDeviceContext::SetBlob(const std::string& name,
                                  std::shared_ptr<void> data) const {
  // operator[] inserts a default entry when `name` is absent and returns the
  // existing one otherwise, so a single lookup covers both cases.
  (*p_blobs_)[name] = data;
}

std::shared_ptr<void> MKLDNNDeviceContext::GetBlob(
    const std::string& name) const {
  std::unordered_map<std::string, std::shared_ptr<void>>* p;
  p = p_blobs_.get();

  auto it = p->find(name);

  if (it != p->end()) {
    return it->second;
  }

  return nullptr;
}

#endif

}  // namespace platform
}  // namespace paddle
Fix the grammar in copyright. (#8403) 7 years ago			`/* Copyright (c) 2016 PaddlePaddle Authors. All Rights Reserved.`
follow comments 8 years ago			`Licensed under the Apache License, Version 2.0 (the "License");`
			`you may not use this file except in compliance with the License.`
			`You may obtain a copy of the License at`
			`http://www.apache.org/licenses/LICENSE-2.0`
			`Unless required by applicable law or agreed to in writing, software`
			`distributed under the License is distributed on an "AS IS" BASIS,`
			`WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.`
			`See the License for the specific language governing permissions and`
			`limitations under the License. */`
Correct #include path 7 years ago			`#include "paddle/fluid/platform/device_context.h"`
Fix part of the cpplint errors in fluid/platform (#9802) 7 years ago
			`#include <string>`
Enhance device context pool (#9293) 7 years ago			`#include <unordered_set>`
Fix part of the cpplint errors in fluid/platform (#9802) 7 years ago			`#include <vector>`

Correct #include path 7 years ago			`#include "paddle/fluid/memory/memory.h"`
Fix part of the cpplint errors in fluid/platform (#9802) 7 years ago
follow comments 8 years ago			`namespace paddle {`
			`namespace platform {`

Feature/operator run place (#6783) * "change operator interface" * "move devicepool to device_context" * "fix operator test" * "fix op_registry Run interface" * "net op passed. Need to fix nccl multi-Context" * "add nccl group function" * "add nccl group function" * "fix gpu count exceed 32 error" * "fix recurrent op, nccl op" * "change the other operators interface with Place" * "fix typo" * "fix pybind" * "fix device in python side" * "fix pybind failed" * "add init for test" * "fix CI" 7 years ago			`DeviceContextPool* DeviceContextPool::pool = nullptr;`

Enhance device context pool (#9293) 7 years ago			`platform::DeviceContext* DeviceContextPool::Get(const platform::Place& place) {`
Feature/operator run place (#6783) * "change operator interface" * "move devicepool to device_context" * "fix operator test" * "fix op_registry Run interface" * "net op passed. Need to fix nccl multi-Context" * "add nccl group function" * "add nccl group function" * "fix gpu count exceed 32 error" * "fix recurrent op, nccl op" * "change the other operators interface with Place" * "fix typo" * "fix pybind" * "fix device in python side" * "fix pybind failed" * "add init for test" * "fix CI" 7 years ago			`auto it = device_contexts_.find(place);`
			`if (it == device_contexts_.end()) {`
			`PADDLE_THROW(`
			`"'Place' is not supported, Please re-compile with WITH_GPU "`
			`"option");`
			`}`
Enhance device context pool (#9293) 7 years ago			`return it->second.get();`
Feature/operator run place (#6783) * "change operator interface" * "move devicepool to device_context" * "fix operator test" * "fix op_registry Run interface" * "net op passed. Need to fix nccl multi-Context" * "add nccl group function" * "add nccl group function" * "fix gpu count exceed 32 error" * "fix recurrent op, nccl op" * "change the other operators interface with Place" * "fix typo" * "fix pybind" * "fix device in python side" * "fix pybind failed" * "add init for test" * "fix CI" 7 years ago			`}`

			`DeviceContextPool::DeviceContextPool(`
			`const std::vector<platform::Place>& places) {`
			`PADDLE_ENFORCE_GT(places.size(), 0);`
Enhance device context pool (#9293) 7 years ago			`using PtrType = std::unique_ptr<DeviceContext>;`
			`std::unordered_set<Place, PlaceHash> set;`
			`for (auto& p : places) {`
			`set.insert(p);`
			`}`

			`for (auto& p : set) {`
			`if (platform::is_cpu_place(p)) {`
MKLDNN conv2d kernel added (#8451) * MKLDNN conv2 OP kernel added * TODOs added * mkldnn conv2d OP refactor * CanCUDNNBeUsed and CanMKLDNNBeUsed moved 7 years ago			`#ifdef PADDLE_WITH_MKLDNN`
Enhance device context pool (#9293) 7 years ago			`device_contexts_.emplace(`
			`p, PtrType(new MKLDNNDeviceContext(boost::get<CPUPlace>(p))));`
MKLDNN conv2d kernel added (#8451) * MKLDNN conv2 OP kernel added * TODOs added * mkldnn conv2d OP refactor * CanCUDNNBeUsed and CanMKLDNNBeUsed moved 7 years ago			`#else`
Enhance device context pool (#9293) 7 years ago			`device_contexts_.emplace(`
			`p, PtrType(new CPUDeviceContext(boost::get<CPUPlace>(p))));`
MKLDNN conv2d kernel added (#8451) * MKLDNN conv2 OP kernel added * TODOs added * mkldnn conv2d OP refactor * CanCUDNNBeUsed and CanMKLDNNBeUsed moved 7 years ago			`#endif`
Enhance device context pool (#9293) 7 years ago			`} else if (platform::is_gpu_place(p)) {`
Feature/operator run place (#6783) * "change operator interface" * "move devicepool to device_context" * "fix operator test" * "fix op_registry Run interface" * "net op passed. Need to fix nccl multi-Context" * "add nccl group function" * "add nccl group function" * "fix gpu count exceed 32 error" * "fix recurrent op, nccl op" * "change the other operators interface with Place" * "fix typo" * "fix pybind" * "fix device in python side" * "fix pybind failed" * "add init for test" * "fix CI" 7 years ago			`#ifdef PADDLE_WITH_CUDA`
Enhance device context pool (#9293) 7 years ago			`device_contexts_.emplace(`
			`p, PtrType(new CUDADeviceContext(boost::get<CUDAPlace>(p))));`
Feature/operator run place (#6783) * "change operator interface" * "move devicepool to device_context" * "fix operator test" * "fix op_registry Run interface" * "net op passed. Need to fix nccl multi-Context" * "add nccl group function" * "add nccl group function" * "fix gpu count exceed 32 error" * "fix recurrent op, nccl op" * "change the other operators interface with Place" * "fix typo" * "fix pybind" * "fix device in python side" * "fix pybind failed" * "add init for test" * "fix CI" 7 years ago			`#else`
			`PADDLE_THROW(`
GPUPlace to CUDAPlace (#6960) 7 years ago			`"'CUDAPlace' is not supported, Please re-compile with WITH_GPU "`
Feature/operator run place (#6783) * "change operator interface" * "move devicepool to device_context" * "fix operator test" * "fix op_registry Run interface" * "net op passed. Need to fix nccl multi-Context" * "add nccl group function" * "add nccl group function" * "fix gpu count exceed 32 error" * "fix recurrent op, nccl op" * "change the other operators interface with Place" * "fix typo" * "fix pybind" * "fix device in python side" * "fix pybind failed" * "add init for test" * "fix CI" 7 years ago			`"option");`
Add CUDAPinnedPlace 7 years ago			`#endif`
			`} else if (platform::is_cuda_pinned_place(p)) {`
			`#ifdef PADDLE_WITH_CUDA`
			`device_contexts_.emplace(`
			`p,`
			`PtrType(new CUDAPinnedDeviceContext(boost::get<CUDAPinnedPlace>(p))));`
			`#else`
			`PADDLE_THROW(`
			`"'CUDAPlace' is not supported, Please re-compile with WITH_GPU "`
			`"option");`
Feature/operator run place (#6783) * "change operator interface" * "move devicepool to device_context" * "fix operator test" * "fix op_registry Run interface" * "net op passed. Need to fix nccl multi-Context" * "add nccl group function" * "add nccl group function" * "fix gpu count exceed 32 error" * "fix recurrent op, nccl op" * "change the other operators interface with Place" * "fix typo" * "fix pybind" * "fix device in python side" * "fix pybind failed" * "add init for test" * "fix CI" 7 years ago			`#endif`
			`}`
			`}`
			`}`

Fix: refine device context and fix place() 8 years ago			`CPUDeviceContext::CPUDeviceContext() {`
			`eigen_device_.reset(new Eigen::DefaultDevice());`
			`}`

"small fix of Place" (#6766) 7 years ago			`CPUDeviceContext::CPUDeviceContext(CPUPlace place) : place_(place) {`
Fix: refine device context and fix place() 8 years ago			`eigen_device_.reset(new Eigen::DefaultDevice());`
			`}`

			`Eigen::DefaultDevice* CPUDeviceContext::eigen_device() const {`
			`return eigen_device_.get();`
			`}`

"small fix of Place" (#6766) 7 years ago			`Place CPUDeviceContext::GetPlace() const { return place_; }`
Fix: refine device context and fix place() 8 years ago
Use PADDLE_WITH_CUDA instead of PADDLE_WITH_GPU 7 years ago			`#ifdef PADDLE_WITH_CUDA`
Fix: refine device context and fix place() 8 years ago
init 8 years ago			`class EigenCudaStreamDevice : public Eigen::StreamInterface {`
			`public:`
			`EigenCudaStreamDevice() : scratch_(nullptr), semaphore_(nullptr) {`
			`Eigen::initializeDeviceProp();`
			`}`
			`~EigenCudaStreamDevice() override {}`

GPUPlace to CUDAPlace (#6960) 7 years ago			`void Reinitialize(const cudaStream_t* cuda_stream, CUDAPlace place) {`
init 8 years ago			`stream_ = cuda_stream;`
			`place_ = place;`
			`device_prop_ = &Eigen::m_deviceProperties[place.device];`
			`}`

			`const cudaStream_t& stream() const override { return *stream_; }`

			`const cudaDeviceProp& deviceProperties() const override {`
			`return *device_prop_;`
			`}`

			`void* allocate(size_t num_bytes) const override {`
fix gpu build error 8 years ago			`return paddle::memory::Alloc(place_, num_bytes);`
init 8 years ago			`}`

			`void deallocate(void* buffer) const override {`
			`paddle::memory::Free(place_, buffer);`
			`}`

			`void* scratchpad() const override {`
			`if (scratch_ == NULL) {`
			`scratch_ = allocate(Eigen::kCudaScratchSize + sizeof(unsigned int));`
			`}`
			`return scratch_;`
			`}`

			`unsigned int* semaphore() const override {`
			`if (semaphore_ == NULL) {`
			`char* scratch =`
			`static_cast<char*>(scratchpad()) + Eigen::kCudaScratchSize;`
			`semaphore_ = reinterpret_cast<unsigned int*>(scratch);`
			`PADDLE_ENFORCE(`
			`cudaMemsetAsync(semaphore_, 0, sizeof(unsigned int), *stream_));`
			`}`
			`return semaphore_;`
			`}`

			`private:`
GPUPlace to CUDAPlace (#6960) 7 years ago			`CUDAPlace place_;`
init 8 years ago			`const cudaStream_t* stream_; // not owned;`
			`const cudaDeviceProp* device_prop_; // not owned;`
fix gpu build error 8 years ago			`mutable void* scratch_;`
init 8 years ago			`mutable unsigned int* semaphore_;`
			`};`

GPUPlace to CUDAPlace (#6960) 7 years ago			`CUDADeviceContext::CUDADeviceContext(CUDAPlace place) : place_(place) {`
Fix: refine device context and fix place() 8 years ago			`SetDeviceId(place_.device);`
address comments 7 years ago			`compute_capability = GetCUDAComputeCapability(place_.device);`
fix bug for big number; float->double and code refine 7 years ago			`multi_process = GetCUDAMultiProcessors(place_.device);`
			`max_threads_per_mp = GetCUDAMaxThreadsPerMultiProcessor(place_.device);`
init 8 years ago			`PADDLE_ENFORCE(cudaStreamCreate(&stream_));`
			`eigen_stream_.reset(new EigenCudaStreamDevice());`
			`eigen_stream_->Reinitialize(&stream_, place);`
Fix: refine device context and fix place() 8 years ago			`eigen_device_.reset(new Eigen::GpuDevice(eigen_stream_.get()));`
Remove lazy-initialization in device_context * Also use `const DeviceContext&` all the time, to prevent `const_cast` Fix #4169 Fix #3468 Fix #3475 8 years ago			`PADDLE_ENFORCE(dynload::cublasCreate(&cublas_handle_));`
			`PADDLE_ENFORCE(dynload::cublasSetStream(cublas_handle_, stream_));`
"remove cudnn devicecontext" (#7207) * "remove cudnndevicecontext" * "remove unused init code" * "fix hash functions" 7 years ago			`if (dynload::HasCUDNN()) {`
			`PADDLE_ENFORCE(dynload::cudnnCreate(&cudnn_handle_));`
			`PADDLE_ENFORCE(dynload::cudnnSetStream(cudnn_handle_, stream_));`
			`} else {`
			`cudnn_handle_ = nullptr;`
			`}`
Fix: refine device context and fix place() 8 years ago			`}`

			`CUDADeviceContext::~CUDADeviceContext() {`
			`SetDeviceId(place_.device);`
FIX: name convention 8 years ago			`Wait();`
Remove lazy-initialization in device_context * Also use `const DeviceContext&` all the time, to prevent `const_cast` Fix #4169 Fix #3468 Fix #3475 8 years ago			`PADDLE_ENFORCE(dynload::cublasDestroy(cublas_handle_));`
"remove cudnn devicecontext" (#7207) * "remove cudnndevicecontext" * "remove unused init code" * "fix hash functions" 7 years ago			`if (cudnn_handle_ != nullptr) {`
			`PADDLE_ENFORCE(dynload::cudnnDestroy(cudnn_handle_));`
			`}`
Fix: refine device context and fix place() 8 years ago			`eigen_stream_.reset();`
			`eigen_device_.reset();`
init 8 years ago			`PADDLE_ENFORCE(cudaStreamDestroy(stream_));`
Fix: refine device context and fix place() 8 years ago			`}`

FIX: name convention 8 years ago			`Place CUDADeviceContext::GetPlace() const { return place_; }`
Fix: refine device context and fix place() 8 years ago
FIX: name convention 8 years ago			`void CUDADeviceContext::Wait() const {`
init 8 years ago			`PADDLE_ENFORCE(cudaStreamSynchronize(stream_));`
Check errors for the cuda kernel calls. (#5436) 7 years ago			`PADDLE_ENFORCE(cudaGetLastError());`
			`}`

address comments 7 years ago			`int CUDADeviceContext::GetComputeCapability() const {`
			`return compute_capability;`
			`}`

fix bug for big number; float->double and code refine 7 years ago			`int CUDADeviceContext::GetMaxPhysicalThreadCount() const {`
			`return multi_process * max_threads_per_mp;`
			`}`

Fix: refine device context and fix place() 8 years ago			`Eigen::GpuDevice* CUDADeviceContext::eigen_device() const {`
			`return eigen_device_.get();`
			`}`

Remove lazy-initialization in device_context * Also use `const DeviceContext&` all the time, to prevent `const_cast` Fix #4169 Fix #3468 Fix #3475 8 years ago			`cublasHandle_t CUDADeviceContext::cublas_handle() const {`
Fix: refine device context and fix place() 8 years ago			`return cublas_handle_;`
			`}`

Remove lazy-initialization in device_context * Also use `const DeviceContext&` all the time, to prevent `const_cast` Fix #4169 Fix #3468 Fix #3475 8 years ago			`cudnnHandle_t CUDADeviceContext::cudnn_handle() const { return cudnn_handle_; }`
Fix: refine device context and fix place() 8 years ago
Remove lazy-initialization in device_context * Also use `const DeviceContext&` all the time, to prevent `const_cast` Fix #4169 Fix #3468 Fix #3475 8 years ago			`cudaStream_t CUDADeviceContext::stream() const { return stream_; }`
refine random related ops 8 years ago
Add CUDAPinnedPlace 7 years ago			`CUDAPinnedDeviceContext::CUDAPinnedDeviceContext() {`
			`eigen_device_.reset(new Eigen::DefaultDevice());`
			`}`

			`CUDAPinnedDeviceContext::CUDAPinnedDeviceContext(CUDAPinnedPlace place)`
			`: place_(place) {`
			`eigen_device_.reset(new Eigen::DefaultDevice());`
			`}`

			`Eigen::DefaultDevice* CUDAPinnedDeviceContext::eigen_device() const {`
			`return eigen_device_.get();`
			`}`

			`Place CUDAPinnedDeviceContext::GetPlace() const { return place_; }`
remove unused PADDLE_ONLY_CPU comment 7 years ago			`#endif`
follow comments 8 years ago
add MKLDNNDeviceContext 7 years ago			`#ifdef PADDLE_WITH_MKLDNN`
			`MKLDNNDeviceContext::MKLDNNDeviceContext(CPUPlace place)`
MKLDNN conv2d kernel added (#8451) * MKLDNN conv2 OP kernel added * TODOs added * mkldnn conv2d OP refactor * CanCUDNNBeUsed and CanMKLDNNBeUsed moved 7 years ago			`: CPUDeviceContext(place), engine_(mkldnn::engine::cpu, 0), p_blobs_() {`
			`p_blobs_.reset(new std::unordered_map<std::string, std::shared_ptr<void>>());`
add MKLDNNDeviceContext 7 years ago			`}`

MKLDNN conv2d kernel added (#8451) * MKLDNN conv2 OP kernel added * TODOs added * mkldnn conv2d OP refactor * CanCUDNNBeUsed and CanMKLDNNBeUsed moved 7 years ago			`void MKLDNNDeviceContext::SetBlob(const std::string& name,`
			`std::shared_ptr<void> data) const {`
			`std::unordered_map<std::string, std::shared_ptr<void>>* p;`
			`p = p_blobs_.get();`
add MKLDNNDeviceContext 7 years ago
MKLDNN conv2d kernel added (#8451) * MKLDNN conv2 OP kernel added * TODOs added * mkldnn conv2d OP refactor * CanCUDNNBeUsed and CanMKLDNNBeUsed moved 7 years ago			`auto it = p->find(name);`
add MKLDNNDeviceContext 7 years ago
MKLDNN conv2d kernel added (#8451) * MKLDNN conv2 OP kernel added * TODOs added * mkldnn conv2d OP refactor * CanCUDNNBeUsed and CanMKLDNNBeUsed moved 7 years ago			`if (it == p->end()) {`
			`(*p)[name] = data; // create new blob`
			`} else {`
			`it->second = data; // set data to existing blob`
			`}`
add MKLDNNDeviceContext 7 years ago
MKLDNN conv2d kernel added (#8451) * MKLDNN conv2 OP kernel added * TODOs added * mkldnn conv2d OP refactor * CanCUDNNBeUsed and CanMKLDNNBeUsed moved 7 years ago			`return;`
add MKLDNNDeviceContext 7 years ago			`}`

MKLDNN conv2d kernel added (#8451) * MKLDNN conv2 OP kernel added * TODOs added * mkldnn conv2d OP refactor * CanCUDNNBeUsed and CanMKLDNNBeUsed moved 7 years ago			`std::shared_ptr<void> MKLDNNDeviceContext::GetBlob(`
			`const std::string& name) const {`
			`std::unordered_map<std::string, std::shared_ptr<void>>* p;`
			`p = p_blobs_.get();`
add MKLDNNDeviceContext 7 years ago
MKLDNN conv2d kernel added (#8451) * MKLDNN conv2 OP kernel added * TODOs added * mkldnn conv2d OP refactor * CanCUDNNBeUsed and CanMKLDNNBeUsed moved 7 years ago			`auto it = p->find(name);`
add MKLDNNDeviceContext 7 years ago
MKLDNN conv2d kernel added (#8451) * MKLDNN conv2 OP kernel added * TODOs added * mkldnn conv2d OP refactor * CanCUDNNBeUsed and CanMKLDNNBeUsed moved 7 years ago			`if (it != p->end()) {`
			`return it->second;`
add MKLDNNDeviceContext 7 years ago			`}`
MKLDNN conv2d kernel added (#8451) * MKLDNN conv2 OP kernel added * TODOs added * mkldnn conv2d OP refactor * CanCUDNNBeUsed and CanMKLDNNBeUsed moved 7 years ago
			`return nullptr;`
add MKLDNNDeviceContext 7 years ago			`}`

			`#endif`

follow comments 8 years ago			`} // namespace platform`
follow comments 8 years ago			`} // namespace paddle`