You can not select more than 25 topics
			Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
		
		
		
		
		
			
		
			
				
					
					
						
							136 lines
						
					
					
						
							3.1 KiB
						
					
					
				
			
		
		
	
	
							136 lines
						
					
					
						
							3.1 KiB
						
					
					
				| /* Copyright (c) 2016 PaddlePaddle Authors. All Rights Reserve.
 | |
| 
 | |
| Licensed under the Apache License, Version 2.0 (the "License");
 | |
| you may not use this file except in compliance with the License.
 | |
| You may obtain a copy of the License at
 | |
| 
 | |
|     http://www.apache.org/licenses/LICENSE-2.0
 | |
| 
 | |
| Unless required by applicable law or agreed to in writing, software
 | |
| distributed under the License is distributed on an "AS IS" BASIS,
 | |
| WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 | |
| See the License for the specific language governing permissions and
 | |
| limitations under the License. */
 | |
| 
 | |
| #ifndef MATHFUNCTIONS_H_
 | |
| #define MATHFUNCTIONS_H_
 | |
| 
 | |
| #ifdef PADDLE_USE_MKLML
 | |
| #include <mkl_cblas.h>
 | |
| #include <mkl_lapacke.h>
 | |
| #include <mkl_vml_functions.h>
 | |
| #endif
 | |
| 
 | |
| #ifdef PADDLE_USE_MKL
 | |
| #include <mkl.h>
 | |
| #include <mkl_lapacke.h>
 | |
| #endif
 | |
| 
 | |
| #if defined(PADDLE_USE_ATLAS) || defined(PADDLE_USE_VECLIB)
 | |
| extern "C" {
 | |
| #include <cblas.h>
 | |
| #include <clapack.h>
 | |
| }
 | |
| #endif
 | |
| 
 | |
| #ifdef PADDLE_USE_OPENBLAS
 | |
| #include <cblas.h>
 | |
| #include <lapacke.h>
 | |
| #endif
 | |
| 
 | |
| #ifndef LAPACK_FOUND
 | |
| extern "C" {
 | |
| #ifndef PADDLE_USE_EIGEN_FOR_BLAS
 | |
| #include <cblas.h>
 | |
| #else
 | |
| typedef enum CBLAS_ORDER {
 | |
|   CblasRowMajor = 101,
 | |
|   CblasColMajor = 102
 | |
| } CBLAS_ORDER;
 | |
| #endif
 | |
| int LAPACKE_sgetrf(
 | |
|     int matrix_layout, int m, int n, float* a, int lda, int* ipiv);
 | |
| int LAPACKE_dgetrf(
 | |
|     int matrix_layout, int m, int n, double* a, int lda, int* ipiv);
 | |
| int LAPACKE_sgetri(
 | |
|     int matrix_layout, int n, float* a, int lda, const int* ipiv);
 | |
| int LAPACKE_dgetri(
 | |
|     int matrix_layout, int n, double* a, int lda, const int* ipiv);
 | |
| }
 | |
| #endif
 | |
| 
 | |
| #include <cmath>
 | |
| 
 | |
| namespace paddle {
 | |
| 
 | |
| #ifndef PADDLE_USE_EIGEN_FOR_BLAS
 | |
| template <class T>
 | |
| void gemm(const CBLAS_TRANSPOSE transA,
 | |
|           const CBLAS_TRANSPOSE transB,
 | |
|           const int M,
 | |
|           const int N,
 | |
|           const int K,
 | |
|           const T alpha,
 | |
|           const T* A,
 | |
|           const int lda,
 | |
|           const T* B,
 | |
|           const int ldb,
 | |
|           const T beta,
 | |
|           T* C,
 | |
|           const int ldc);
 | |
| #endif
 | |
| 
 | |
| template <class T>
 | |
| int getrf(const CBLAS_ORDER Order,
 | |
|           const int M,
 | |
|           const int N,
 | |
|           T* A,
 | |
|           const int lda,
 | |
|           int* ipiv);
 | |
| 
 | |
| template <class T>
 | |
| int getri(
 | |
|     const CBLAS_ORDER Order, const int N, T* A, const int lda, const int* ipiv);
 | |
| 
 | |
| template <class T>
 | |
| void axpy(const int n, const T alpha, const T* x, T* y) {
 | |
|   /// y = y + alpha * x
 | |
|   for (int i = 0; i < n; i++) {
 | |
|     y[i] = y[i] + alpha * x[i];
 | |
|   }
 | |
| }
 | |
| 
 | |
| template <class T>
 | |
| T dotProduct(const int n, const T* x, const T* y) {
 | |
|   T result = static_cast<T>(0);
 | |
|   for (int i = 0; i < n; i++) {
 | |
|     result += x[i] * y[i];
 | |
|   }
 | |
|   return result;
 | |
| }
 | |
| 
 | |
| template <class T>
 | |
| void vExp(const int n, const T* a, T* r);
 | |
| 
 | |
| template <class T>
 | |
| void vPow(const int n, const T* a, const T b, T* r);
 | |
| 
 | |
| template <class T>
 | |
| void vLog(const int n, const T* a, T* r);
 | |
| 
 | |
| template <class T>
 | |
| void vAdd(const int n, const T* a, const T* b, T* r);
 | |
| 
 | |
| template <class T>
 | |
| void vInvSqrt(const int n, const T* a, T* r);
 | |
| 
 | |
| template <class T>
 | |
| void vLog1p(const int n, const T* a, T* r);
 | |
| 
 | |
| template <class T>
 | |
| void vTanh(const int n, const T* a, T* r);
 | |
| 
 | |
| }  // namespace paddle
 | |
| 
 | |
| #endif  // MATHFUNCTIONS_H_
 |