Paddle/paddle/fluid/operators/mkldnn/lrn_mkldnn_op.cc

/* Copyright (c) 2018 PaddlePaddle Authors. All Rights Reserve.

Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at

    http://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License. */

#include "paddle/fluid/platform/mkldnn_reuse.h"

namespace paddle {
namespace framework {
class Tensor;
}  // namespace framework
namespace platform {
class MKLDNNDeviceContext;
}  // namespace platform
}  // namespace paddle

namespace paddle {
namespace operators {

using paddle::framework::Tensor;
using paddle::platform::MKLDNNDeviceContext;

template <typename T>
class LRNMKLDNNOpKernel : public paddle::framework::OpKernel<T> {
 public:
  void Compute(const paddle::framework::ExecutionContext& ctx) const override {
    const bool is_float_type = std::is_same<T, float>::value;
    PADDLE_ENFORCE_EQ(
        is_float_type, true,
        platform::errors::PreconditionNotMet("DNNL LRN must use float data."));
    PADDLE_ENFORCE_EQ(platform::is_cpu_place(ctx.GetPlace()), true,
                      paddle::platform::errors::PreconditionNotMet(
                          "Operator DNNL LRN must use CPUPlace"));
    auto& dev_ctx =
        ctx.template device_context<platform::MKLDNNDeviceContext>();
    const auto& mkldnn_engine = dev_ctx.GetEngine();

    auto x = ctx.Input<Tensor>("X");
    auto out = ctx.Output<Tensor>("Out");
    auto mid = ctx.Output<Tensor>("MidOut");

    platform::LRNMKLDNNHandler<T> handler(
        ctx, dev_ctx, mkldnn_engine, ctx.GetPlace(), x, ctx.OutputName("Out"));

    auto src_memory = handler.AcquireSrcMemory(x);
    auto dst_memory = handler.AcquireDstMemory(out);

    auto lrn_p = handler.AcquireForwardPrimitive();

    auto workspace_memory = handler.AcquireWorkspaceMemory(mid);
    mid->set_layout(framework::DataLayout::kMKLDNN);

    mkldnn::stream astream(dev_ctx.GetEngine());
    if (!workspace_memory->get_desc().is_zero()) {
      mid->set_format(platform::GetMKLDNNFormat(*workspace_memory));
      lrn_p->execute(astream, {{MKLDNN_ARG_SRC, *src_memory},
                               {MKLDNN_ARG_DST, *dst_memory},
                               {MKLDNN_ARG_WORKSPACE, *workspace_memory}});
    } else {
      lrn_p->execute(astream, {{MKLDNN_ARG_SRC, *src_memory},
                               {MKLDNN_ARG_DST, *dst_memory}});
    }
    astream.wait();

    out->set_layout(framework::DataLayout::kMKLDNN);
    out->set_format(platform::GetMKLDNNFormat(*dst_memory));
  }
};

template <typename T>
class LRNMKLDNNGradOpKernel : public paddle::framework::OpKernel<T> {
 public:
  void Compute(const paddle::framework::ExecutionContext& ctx) const override {
    const bool is_float_type = std::is_same<T, float>::value;
    PADDLE_ENFORCE_EQ(is_float_type, true,
                      platform::errors::PreconditionNotMet(
                          "DNNL LRN GradOpKernel must use float data."));
    PADDLE_ENFORCE_EQ(platform::is_cpu_place(ctx.GetPlace()), true,
                      paddle::platform::errors::PreconditionNotMet(
                          "Operator DNNL LRNGrad must use CPUPlace"));
    PADDLE_ENFORCE_EQ(
        ctx.Attr<bool>("is_test"), false,
        platform::errors::PreconditionNotMet(
            "is_test attribute should be set to False in training phase."));

    auto x = ctx.Input<Tensor>("X");
    auto mid = ctx.Input<Tensor>("MidOut");

    auto out_grad = ctx.Input<Tensor>(framework::GradVarName("Out"));
    auto x_grad = ctx.Output<Tensor>(framework::GradVarName("X"));

    const int n = ctx.Attr<int>("n");
    const float alpha = ctx.Attr<float>("alpha") * static_cast<float>(n);
    const float beta = ctx.Attr<float>("beta");
    const float k = ctx.Attr<float>("k");

    auto& dev_ctx = ctx.template device_context<MKLDNNDeviceContext>();

    auto dims = paddle::framework::vectorize<int64_t>(x->dims());

    platform::LRNMKLDNNHandler<T> handler(dims, n, alpha, beta, k, x->format(),
                                          out_grad->format(), dev_ctx,
                                          ctx.GetPlace(), ctx.InputName("Out"));

    auto src_memory = handler.AcquireSrcMemory(x);
    auto workspace = handler.AcquireBackwardWorkspaceMemory(mid);
    auto diff_dst_memory = handler.AcquireDiffDstMemory(out_grad);
    auto diff_src_memory = handler.AcquireDiffSrcMemory(x_grad);

    auto lrn_bwd = handler.AcquireBackwardPrimitive();

    mkldnn::stream astream(dev_ctx.GetEngine());
    lrn_bwd->execute(astream, {{MKLDNN_ARG_SRC, *src_memory},
                               {MKLDNN_ARG_DIFF_DST, *diff_dst_memory},
                               {MKLDNN_ARG_DIFF_SRC, *diff_src_memory},
                               {MKLDNN_ARG_WORKSPACE, *workspace}});
    astream.wait();

    x_grad->set_layout(framework::DataLayout::kMKLDNN);
    x_grad->set_format(platform::GetMKLDNNFormat(*diff_src_memory));
  }
};
}  // namespace operators
}  // namespace paddle

namespace ops = paddle::operators;

REGISTER_OP_KERNEL(lrn, MKLDNN, paddle::platform::CPUPlace,
                   ops::LRNMKLDNNOpKernel<float>);
REGISTER_OP_KERNEL(lrn_grad, MKLDNN, paddle::platform::CPUPlace,
                   ops::LRNMKLDNNGradOpKernel<float>);
Implementation of MKLDNN LRN 7 years ago			`/* Copyright (c) 2018 PaddlePaddle Authors. All Rights Reserve.`

			`Licensed under the Apache License, Version 2.0 (the "License");`
			`you may not use this file except in compliance with the License.`
			`You may obtain a copy of the License at`

			`http://www.apache.org/licenses/LICENSE-2.0`

			`Unless required by applicable law or agreed to in writing, software`
			`distributed under the License is distributed on an "AS IS" BASIS,`
			`WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.`
			`See the License for the specific language governing permissions and`
			`limitations under the License. */`

[MKL-DNN] Extended LRN with reusing via Acquire API (#18675) test=develop - compileation fix - Yet another compilation fix - Even yet another compilation fix - Surprise! Again compilation fix - lint fixes test=develop - Fix to workspace acquire of LRN test=develop - Fix to hash of BWD LRN test=develop - fix to lrn BWD PD acquire test=develop - Fixing LRN PD creation test=develop - cosmetic fix in comment test=develop - Fixes after review test=develop 6 years ago			`#include "paddle/fluid/platform/mkldnn_reuse.h"`
Implementation of MKLDNN LRN 7 years ago
use iwyu clean include (#27267) * use iwyu clean include, test=develop, test=win * compilation error, test=develop * fix compilation error2, test=develop * fix compilation error3, test=develop * fix compilation error4, test=develop * fix compilation error5, test=develop * fix compilation error6, test=develop * fix compilation error7, test=develop * fix compilation error8, test=develop * fix compilation error8, test=develop * fix compilation error10, test=develop * fix compilation error11, test=develop 4 years ago			`namespace paddle {`
			`namespace framework {`
			`class Tensor;`
			`} // namespace framework`
			`namespace platform {`
			`class MKLDNNDeviceContext;`
			`} // namespace platform`
			`} // namespace paddle`

Implementation of MKLDNN LRN 7 years ago			`namespace paddle {`
			`namespace operators {`

			`using paddle::framework::Tensor;`
			`using paddle::platform::MKLDNNDeviceContext;`

			`template <typename T>`
			`class LRNMKLDNNOpKernel : public paddle::framework::OpKernel<T> {`
			`public:`
			`void Compute(const paddle::framework::ExecutionContext& ctx) const override {`
Avoid comma in macro test=develop 6 years ago			`const bool is_float_type = std::is_same<T, float>::value;`
Update PADDLE_ENFORCE in DNNL related ops (#24333) * Update PADDLE_ENFORCE in DNNL related ops test=develop * Abstract macro of OP_GET_PLACE_CHECK test=develop * update according to reviews * update GET_PLACE_CPU_CHECK * fix typo test=develop * revert macro test=develop 5 years ago			`PADDLE_ENFORCE_EQ(`
			`is_float_type, true,`
			`platform::errors::PreconditionNotMet("DNNL LRN must use float data."));`
			`PADDLE_ENFORCE_EQ(platform::is_cpu_place(ctx.GetPlace()), true,`
			`paddle::platform::errors::PreconditionNotMet(`
			`"Operator DNNL LRN must use CPUPlace"));`
Add isCached() mechanism for BatchNorm and LRN oneDNN operators (#24798) * Add isCached() mechanism for BatchNorm and LRN oneDNN operators test=develop * Formatting fix test=develop 5 years ago			`auto& dev_ctx =`
			`ctx.template device_context<platform::MKLDNNDeviceContext>();`
			`const auto& mkldnn_engine = dev_ctx.GetEngine();`
Implementation of MKLDNN LRN 7 years ago
			`auto x = ctx.Input<Tensor>("X");`
			`auto out = ctx.Output<Tensor>("Out");`
			`auto mid = ctx.Output<Tensor>("MidOut");`

Add isCached() mechanism for BatchNorm and LRN oneDNN operators (#24798) * Add isCached() mechanism for BatchNorm and LRN oneDNN operators test=develop * Formatting fix test=develop 5 years ago			`platform::LRNMKLDNNHandler<T> handler(`
			`ctx, dev_ctx, mkldnn_engine, ctx.GetPlace(), x, ctx.OutputName("Out"));`
[MKL-DNN] LRN refactoring (#19798) - LRN mkl-dnn kernel refactor test=develop - compilation fix - Another compilation fix - Compilation fix - another compilation fix - compilation fix - Crash fix - optional LRN mkldnn workspace - Added mid allocation - Workaround for tests - Removed gradient from is_test ut - Removed mid for inference - Reverted LRN mid removal for is_test - PADDLE_ENFORCE adjusted - Rebase to templatization commit - Compilation fix - compilation fix test=develop - lint test=develop - Fix to crash - Rebase to recent codebase - lin - lint - compilation fix 6 years ago
			`auto src_memory = handler.AcquireSrcMemory(x);`
			`auto dst_memory = handler.AcquireDstMemory(out);`

MKL-DNN 1.0 Update (#20162) * MKLDNN v1.0 rebase to Paddle 1.6 test=develop * Add hacky paddle::string::to_string() implementation * vectorize<int64-t>() -> vectorize() cleanup test=develop * PADDLE_ENFORCE and void_cast fixes test=develop * Rebase changes test=develop * Cosmetics test=develop * Delete MKL from mkldnn.cmake test=develop * CMake debug commands test=develop * Delete MKLDNN_VERBOSE and rebase fixes test=develop * Rebase fixes test=develop * Temporarily disable int8 resnet101 vgg16 and vgg19 tests test=develop * Add libmkldnn.so.1 to python setup test=develop * Add libmkldnn.so.1 to inference_lib cmake after rebase test=develop * Post rebase fixes + FC int8 changes test=develop * Fix LRN NHWC test=develop * Fix NHWC conv3d test=develop * Windows build fix + next conv3d fix test=develop * Fix conv2d on AVX2 machines test=develop 5 years ago			`auto lrn_p = handler.AcquireForwardPrimitive();`

			`auto workspace_memory = handler.AcquireWorkspaceMemory(mid);`
			`mid->set_layout(framework::DataLayout::kMKLDNN);`

			`mkldnn::stream astream(dev_ctx.GetEngine());`
			`if (!workspace_memory->get_desc().is_zero()) {`
[MKL-DNN] LRN and Pool2d (FWD) NHWC support (#21375) 5 years ago			`mid->set_format(platform::GetMKLDNNFormat(*workspace_memory));`
MKL-DNN 1.0 Update (#20162) * MKLDNN v1.0 rebase to Paddle 1.6 test=develop * Add hacky paddle::string::to_string() implementation * vectorize<int64-t>() -> vectorize() cleanup test=develop * PADDLE_ENFORCE and void_cast fixes test=develop * Rebase changes test=develop * Cosmetics test=develop * Delete MKL from mkldnn.cmake test=develop * CMake debug commands test=develop * Delete MKLDNN_VERBOSE and rebase fixes test=develop * Rebase fixes test=develop * Temporarily disable int8 resnet101 vgg16 and vgg19 tests test=develop * Add libmkldnn.so.1 to python setup test=develop * Add libmkldnn.so.1 to inference_lib cmake after rebase test=develop * Post rebase fixes + FC int8 changes test=develop * Fix LRN NHWC test=develop * Fix NHWC conv3d test=develop * Windows build fix + next conv3d fix test=develop * Fix conv2d on AVX2 machines test=develop 5 years ago			`lrn_p->execute(astream, {{MKLDNN_ARG_SRC, *src_memory},`
			`{MKLDNN_ARG_DST, *dst_memory},`
			`{MKLDNN_ARG_WORKSPACE, *workspace_memory}});`
[MKL-DNN] LRN refactoring (#19798) - LRN mkl-dnn kernel refactor test=develop - compilation fix - Another compilation fix - Compilation fix - another compilation fix - compilation fix - Crash fix - optional LRN mkldnn workspace - Added mid allocation - Workaround for tests - Removed gradient from is_test ut - Removed mid for inference - Reverted LRN mid removal for is_test - PADDLE_ENFORCE adjusted - Rebase to templatization commit - Compilation fix - compilation fix test=develop - lint test=develop - Fix to crash - Rebase to recent codebase - lin - lint - compilation fix 6 years ago			`} else {`
MKL-DNN 1.0 Update (#20162) * MKLDNN v1.0 rebase to Paddle 1.6 test=develop * Add hacky paddle::string::to_string() implementation * vectorize<int64-t>() -> vectorize() cleanup test=develop * PADDLE_ENFORCE and void_cast fixes test=develop * Rebase changes test=develop * Cosmetics test=develop * Delete MKL from mkldnn.cmake test=develop * CMake debug commands test=develop * Delete MKLDNN_VERBOSE and rebase fixes test=develop * Rebase fixes test=develop * Temporarily disable int8 resnet101 vgg16 and vgg19 tests test=develop * Add libmkldnn.so.1 to python setup test=develop * Add libmkldnn.so.1 to inference_lib cmake after rebase test=develop * Post rebase fixes + FC int8 changes test=develop * Fix LRN NHWC test=develop * Fix NHWC conv3d test=develop * Windows build fix + next conv3d fix test=develop * Fix conv2d on AVX2 machines test=develop 5 years ago			`lrn_p->execute(astream, {{MKLDNN_ARG_SRC, *src_memory},`
			`{MKLDNN_ARG_DST, *dst_memory}});`
			`}`
			`astream.wait();`
[MKL-DNN] Extended LRN with reusing via Acquire API (#18675) test=develop - compileation fix - Yet another compilation fix - Even yet another compilation fix - Surprise! Again compilation fix - lint fixes test=develop - Fix to workspace acquire of LRN test=develop - Fix to hash of BWD LRN test=develop - fix to lrn BWD PD acquire test=develop - Fixing LRN PD creation test=develop - cosmetic fix in comment test=develop - Fixes after review test=develop 6 years ago
			`out->set_layout(framework::DataLayout::kMKLDNN);`
Minor GetMKLDNNFormat changes (#20055) test=develop 5 years ago			`out->set_format(platform::GetMKLDNNFormat(*dst_memory));`
Implementation of MKLDNN LRN 7 years ago			`}`
			`};`

			`template <typename T>`
			`class LRNMKLDNNGradOpKernel : public paddle::framework::OpKernel<T> {`
			`public:`
			`void Compute(const paddle::framework::ExecutionContext& ctx) const override {`
Avoid comma in macro test=develop 6 years ago			`const bool is_float_type = std::is_same<T, float>::value;`
Update PADDLE_ENFORCE in DNNL related ops (#24333) * Update PADDLE_ENFORCE in DNNL related ops test=develop * Abstract macro of OP_GET_PLACE_CHECK test=develop * update according to reviews * update GET_PLACE_CPU_CHECK * fix typo test=develop * revert macro test=develop 5 years ago			`PADDLE_ENFORCE_EQ(is_float_type, true,`
			`platform::errors::PreconditionNotMet(`
[oneDNN] LRN cleanup (#25416) 5 years ago			`"DNNL LRN GradOpKernel must use float data."));`
Update PADDLE_ENFORCE in DNNL related ops (#24333) * Update PADDLE_ENFORCE in DNNL related ops test=develop * Abstract macro of OP_GET_PLACE_CHECK test=develop * update according to reviews * update GET_PLACE_CPU_CHECK * fix typo test=develop * revert macro test=develop 5 years ago			`PADDLE_ENFORCE_EQ(platform::is_cpu_place(ctx.GetPlace()), true,`
			`paddle::platform::errors::PreconditionNotMet(`
			`"Operator DNNL LRNGrad must use CPUPlace"));`
			`PADDLE_ENFORCE_EQ(`
			`ctx.Attr<bool>("is_test"), false,`
			`platform::errors::PreconditionNotMet(`
			`"is_test attribute should be set to False in training phase."));`
Implementation of MKLDNN LRN 7 years ago
			`auto x = ctx.Input<Tensor>("X");`
[MKL-DNN] LRN refactoring (#19798) - LRN mkl-dnn kernel refactor test=develop - compilation fix - Another compilation fix - Compilation fix - another compilation fix - compilation fix - Crash fix - optional LRN mkldnn workspace - Added mid allocation - Workaround for tests - Removed gradient from is_test ut - Removed mid for inference - Reverted LRN mid removal for is_test - PADDLE_ENFORCE adjusted - Rebase to templatization commit - Compilation fix - compilation fix test=develop - lint test=develop - Fix to crash - Rebase to recent codebase - lin - lint - compilation fix 6 years ago			`auto mid = ctx.Input<Tensor>("MidOut");`
Implementation of MKLDNN LRN 7 years ago
			`auto out_grad = ctx.Input<Tensor>(framework::GradVarName("Out"));`
			`auto x_grad = ctx.Output<Tensor>(framework::GradVarName("X"));`

			`const int n = ctx.Attr<int>("n");`
- Compensation fix to LRN MKL-DNN op test=develop 6 years ago			`const float alpha = ctx.Attr<float>("alpha") * static_cast<float>(n);`
Implementation of MKLDNN LRN 7 years ago			`const float beta = ctx.Attr<float>("beta");`
			`const float k = ctx.Attr<float>("k");`

			`auto& dev_ctx = ctx.template device_context<MKLDNNDeviceContext>();`

MKL-DNN 1.0 Update (#20162) * MKLDNN v1.0 rebase to Paddle 1.6 test=develop * Add hacky paddle::string::to_string() implementation * vectorize<int64-t>() -> vectorize() cleanup test=develop * PADDLE_ENFORCE and void_cast fixes test=develop * Rebase changes test=develop * Cosmetics test=develop * Delete MKL from mkldnn.cmake test=develop * CMake debug commands test=develop * Delete MKLDNN_VERBOSE and rebase fixes test=develop * Rebase fixes test=develop * Temporarily disable int8 resnet101 vgg16 and vgg19 tests test=develop * Add libmkldnn.so.1 to python setup test=develop * Add libmkldnn.so.1 to inference_lib cmake after rebase test=develop * Post rebase fixes + FC int8 changes test=develop * Fix LRN NHWC test=develop * Fix NHWC conv3d test=develop * Windows build fix + next conv3d fix test=develop * Fix conv2d on AVX2 machines test=develop 5 years ago			`auto dims = paddle::framework::vectorize<int64_t>(x->dims());`
Implementation of MKLDNN LRN 7 years ago
Add dygraph execution context (#20157) * add_dygraph_execution_context * add dygraph infershape context and execution context; test=develop * fix imperative bug; test=develop * remove inputs outputs interface from execution context, because it have same function with inputNames; test=develop * remove tracer_test ctest; test=develop * fix split op bug; test=develop * fix unitests bug; test=develop * fix distribute test bug; test=develop * fix ngraph compile bug; test=develop * fix grad maker bug; test=develop * fix load op bugs; test=develop * fix operator.cc construct bug; test=develop * remove useless name find in operator; test=develop * add tracer_test; test=develop * fix concat, split bug; test=develop * remove tracer_test unitest; test=develop * fix attribute check bug; test=develop * add test code to fix converage; test=develop * remove useless code, change check backward input in engin; test=develop * unlock var type infer shape;test=develop * add ShareAllLoD api; test=develop * add dygraph infershape context unitest; test=develop * remove increase and decrease lod in dygraph; test=develop * addd override; test=develop * fix increase descrease lod; test=develop * fix paddle_enforce; test=develop * disable lod op dygraph check; test=develop * fix paddle enforce error; test=develop * add comment for op_registry and OperatorBase; test=develop * optimize the comment of op_registry; test=develop * fix format of comment; test=develop * fix format of comment; test=develop * optimize the format of comment; test=develop * optimize the format of the comment; test=develop * optimize comment of op_registry; test=develop 5 years ago			`platform::LRNMKLDNNHandler<T> handler(dims, n, alpha, beta, k, x->format(),`
			`out_grad->format(), dev_ctx,`
			`ctx.GetPlace(), ctx.InputName("Out"));`
Implementation of MKLDNN LRN 7 years ago
[MKL-DNN] LRN refactoring (#19798) - LRN mkl-dnn kernel refactor test=develop - compilation fix - Another compilation fix - Compilation fix - another compilation fix - compilation fix - Crash fix - optional LRN mkldnn workspace - Added mid allocation - Workaround for tests - Removed gradient from is_test ut - Removed mid for inference - Reverted LRN mid removal for is_test - PADDLE_ENFORCE adjusted - Rebase to templatization commit - Compilation fix - compilation fix test=develop - lint test=develop - Fix to crash - Rebase to recent codebase - lin - lint - compilation fix 6 years ago			`auto src_memory = handler.AcquireSrcMemory(x);`
			`auto workspace = handler.AcquireBackwardWorkspaceMemory(mid);`
			`auto diff_dst_memory = handler.AcquireDiffDstMemory(out_grad);`
			`auto diff_src_memory = handler.AcquireDiffSrcMemory(x_grad);`
Implementation of MKLDNN LRN 7 years ago
MKL-DNN 1.0 Update (#20162) * MKLDNN v1.0 rebase to Paddle 1.6 test=develop * Add hacky paddle::string::to_string() implementation * vectorize<int64-t>() -> vectorize() cleanup test=develop * PADDLE_ENFORCE and void_cast fixes test=develop * Rebase changes test=develop * Cosmetics test=develop * Delete MKL from mkldnn.cmake test=develop * CMake debug commands test=develop * Delete MKLDNN_VERBOSE and rebase fixes test=develop * Rebase fixes test=develop * Temporarily disable int8 resnet101 vgg16 and vgg19 tests test=develop * Add libmkldnn.so.1 to python setup test=develop * Add libmkldnn.so.1 to inference_lib cmake after rebase test=develop * Post rebase fixes + FC int8 changes test=develop * Fix LRN NHWC test=develop * Fix NHWC conv3d test=develop * Windows build fix + next conv3d fix test=develop * Fix conv2d on AVX2 machines test=develop 5 years ago			`auto lrn_bwd = handler.AcquireBackwardPrimitive();`
Implementation of MKLDNN LRN 7 years ago
MKL-DNN 1.0 Update (#20162) * MKLDNN v1.0 rebase to Paddle 1.6 test=develop * Add hacky paddle::string::to_string() implementation * vectorize<int64-t>() -> vectorize() cleanup test=develop * PADDLE_ENFORCE and void_cast fixes test=develop * Rebase changes test=develop * Cosmetics test=develop * Delete MKL from mkldnn.cmake test=develop * CMake debug commands test=develop * Delete MKLDNN_VERBOSE and rebase fixes test=develop * Rebase fixes test=develop * Temporarily disable int8 resnet101 vgg16 and vgg19 tests test=develop * Add libmkldnn.so.1 to python setup test=develop * Add libmkldnn.so.1 to inference_lib cmake after rebase test=develop * Post rebase fixes + FC int8 changes test=develop * Fix LRN NHWC test=develop * Fix NHWC conv3d test=develop * Windows build fix + next conv3d fix test=develop * Fix conv2d on AVX2 machines test=develop 5 years ago			`mkldnn::stream astream(dev_ctx.GetEngine());`
			`lrn_bwd->execute(astream, {{MKLDNN_ARG_SRC, *src_memory},`
			`{MKLDNN_ARG_DIFF_DST, *diff_dst_memory},`
			`{MKLDNN_ARG_DIFF_SRC, *diff_src_memory},`
			`{MKLDNN_ARG_WORKSPACE, *workspace}});`
			`astream.wait();`
[MKL-DNN] Extended LRN with reusing via Acquire API (#18675) test=develop - compileation fix - Yet another compilation fix - Even yet another compilation fix - Surprise! Again compilation fix - lint fixes test=develop - Fix to workspace acquire of LRN test=develop - Fix to hash of BWD LRN test=develop - fix to lrn BWD PD acquire test=develop - Fixing LRN PD creation test=develop - cosmetic fix in comment test=develop - Fixes after review test=develop 6 years ago
			`x_grad->set_layout(framework::DataLayout::kMKLDNN);`
Minor GetMKLDNNFormat changes (#20055) test=develop 5 years ago			`x_grad->set_format(platform::GetMKLDNNFormat(*diff_src_memory));`
Implementation of MKLDNN LRN 7 years ago			`}`
			`};`
			`} // namespace operators`
			`} // namespace paddle`

			`namespace ops = paddle::operators;`

			`REGISTER_OP_KERNEL(lrn, MKLDNN, paddle::platform::CPUPlace,`
			`ops::LRNMKLDNNOpKernel<float>);`
			`REGISTER_OP_KERNEL(lrn_grad, MKLDNN, paddle::platform::CPUPlace,`
			`ops::LRNMKLDNNGradOpKernel<float>);`