From e1ed3b9c15eb1e99d981f0a9e6d9fb29a997290f Mon Sep 17 00:00:00 2001
From: TFBunny
Date: Fri, 12 Feb 2021 16:17:16 -0500
Subject: [PATCH] add float64 support to assign GPU

---
 .../gpu/other/assign_gpu_kernel.cc |  6 +++++-
 .../gpu/other/assign_gpu_kernel.h  | 12 +++++------
 tests/st/ops/gpu/test_assign_op.py | 20 ++++++++++++++++++-
 3 files changed, 30 insertions(+), 8 deletions(-)

diff --git a/mindspore/ccsrc/backend/kernel_compiler/gpu/other/assign_gpu_kernel.cc b/mindspore/ccsrc/backend/kernel_compiler/gpu/other/assign_gpu_kernel.cc
index b17a55c37c..06a329dc2d 100644
--- a/mindspore/ccsrc/backend/kernel_compiler/gpu/other/assign_gpu_kernel.cc
+++ b/mindspore/ccsrc/backend/kernel_compiler/gpu/other/assign_gpu_kernel.cc
@@ -1,5 +1,5 @@
 /**
- * Copyright 2020 Huawei Technologies Co., Ltd
+ * Copyright 2020-2021 Huawei Technologies Co., Ltd
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -18,6 +18,10 @@
 
 namespace mindspore {
 namespace kernel {
+MS_REG_GPU_KERNEL_ONE(
+  Assign,
+  KernelAttr().AddInputAttr(kNumberTypeFloat64).AddInputAttr(kNumberTypeFloat64).AddOutputAttr(kNumberTypeFloat64),
+  AssignGpuKernel, double)
 MS_REG_GPU_KERNEL_ONE(
   Assign,
   KernelAttr().AddInputAttr(kNumberTypeFloat32).AddInputAttr(kNumberTypeFloat32).AddOutputAttr(kNumberTypeFloat32),
diff --git a/mindspore/ccsrc/backend/kernel_compiler/gpu/other/assign_gpu_kernel.h b/mindspore/ccsrc/backend/kernel_compiler/gpu/other/assign_gpu_kernel.h
index 1333513e29..324258ed94 100644
--- a/mindspore/ccsrc/backend/kernel_compiler/gpu/other/assign_gpu_kernel.h
+++ b/mindspore/ccsrc/backend/kernel_compiler/gpu/other/assign_gpu_kernel.h
@@ -1,5 +1,5 @@
 /**
- * Copyright 2020 Huawei Technologies Co., Ltd
+ * Copyright 2020-2021 Huawei Technologies Co., Ltd
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -14,8 +14,8 @@
  * limitations under the License.
  */
 
-#ifndef MINDSPORE_CCSRC_BACKEND_KERNEL_COMPILER_GPU_ASSIGN_GPU_KERNEL_H
-#define MINDSPORE_CCSRC_BACKEND_KERNEL_COMPILER_GPU_ASSIGN_GPU_KERNEL_H
+#ifndef MINDSPORE_CCSRC_BACKEND_KERNEL_COMPILER_GPU_OTHER_ASSIGN_GPU_KERNEL_H_
+#define MINDSPORE_CCSRC_BACKEND_KERNEL_COMPILER_GPU_OTHER_ASSIGN_GPU_KERNEL_H_
 
 #include <vector>
 #include "backend/kernel_compiler/gpu/gpu_kernel.h"
@@ -40,11 +40,11 @@ class AssignGpuKernel : public GpuKernel {
     CHECK_CUDA_RET_WITH_EXCEPT(
       kernel_node_,
       cudaMemcpyAsync(var, value, input_size_, cudaMemcpyDeviceToDevice, reinterpret_cast<cudaStream_t>(stream_ptr)),
-      "cudaMemxcpyAsync failed.");
+      "cudaMemcpyAsync failed.");
     CHECK_CUDA_RET_WITH_EXCEPT(
       kernel_node_,
       cudaMemcpyAsync(output, value, input_size_, cudaMemcpyDeviceToDevice, reinterpret_cast<cudaStream_t>(stream_ptr)),
-      "cudaMemxcpyAsync failed.");
+      "cudaMemcpyAsync failed.");
     return true;
   }
 
@@ -93,4 +93,4 @@ class AssignGpuKernel : public GpuKernel {
 }  // namespace kernel
 }  // namespace mindspore
 
-#endif  // MINDSPORE_CCSRC_BACKEND_KERNEL_COMPILER_GPU_ASSIGN_GPU_KERNEL_H
+#endif  // MINDSPORE_CCSRC_BACKEND_KERNEL_COMPILER_GPU_OTHER_ASSIGN_GPU_KERNEL_H_
diff --git a/tests/st/ops/gpu/test_assign_op.py b/tests/st/ops/gpu/test_assign_op.py
index 251d07ca93..c08337a176 100644
--- a/tests/st/ops/gpu/test_assign_op.py
+++ b/tests/st/ops/gpu/test_assign_op.py
@@ -1,4 +1,4 @@
-# Copyright 2020 Huawei Technologies Co., Ltd
+# Copyright 2020-2021 Huawei Technologies Co., Ltd
 #
 # Licensed under the Apache License, Version 2.0 (the "License");
 # you may not use this file except in compliance with the License.
@@ -52,3 +52,21 @@ def test_assign():
     assert np.all(-diff1 < error)
     assert np.all(diff2 < error)
     assert np.all(-diff2 < error)
+
+
+@pytest.mark.level0
+@pytest.mark.platform_x86_gpu_training
+@pytest.mark.env_onecard
+def test_assign_float64():
+    context.set_context(mode=context.GRAPH_MODE, device_target="GPU")
+    var = Tensor(x.astype(np.float64))
+    assign = Net(var)
+    output = assign(Tensor(value.astype(np.float64)))
+
+    error = np.ones(shape=[2, 2]) * 1.0e-6
+    diff1 = output.asnumpy() - value
+    diff2 = assign.var.data.asnumpy() - value
+    assert np.all(diff1 < error)
+    assert np.all(-diff1 < error)
+    assert np.all(diff2 < error)
+    assert np.all(-diff2 < error)
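
Note (not part of the patch): the sketch below shows how the new float64 registration can be exercised from user code on a MindSpore build that includes this kernel. The wrapper cell AssignNet and its tensor values are illustrative names, not defined by the patch; they mirror the Net cell used in test_assign_op.py.

import numpy as np

import mindspore.context as context
import mindspore.nn as nn
from mindspore import Tensor, Parameter
from mindspore.ops import operations as P


class AssignNet(nn.Cell):
    """Wraps P.Assign so the call dispatches to AssignGpuKernel."""

    def __init__(self, init_value):
        super(AssignNet, self).__init__()
        self.var = Parameter(init_value, name="var")
        self.assign = P.Assign()

    def construct(self, value):
        return self.assign(self.var, value)


if __name__ == "__main__":
    context.set_context(mode=context.GRAPH_MODE, device_target="GPU")
    # float64 inputs now resolve to the double instantiation registered in assign_gpu_kernel.cc.
    net = AssignNet(Tensor(np.zeros((2, 2), dtype=np.float64)))
    out = net(Tensor(np.array([[1.0, 2.0], [3.0, 4.0]], dtype=np.float64)))
    print(out.asnumpy())            # the assigned value is returned as the op output
    print(net.var.data.asnumpy())   # the parameter itself now holds the assigned value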