@@ -495,6 +495,31 @@ static void __inline blas_lock(volatile BLASULONG *address){ | |||||
#define MMAP_POLICY (MAP_PRIVATE | MAP_ANONYMOUS) | #define MMAP_POLICY (MAP_PRIVATE | MAP_ANONYMOUS) | ||||
#endif | #endif | ||||
/* Select the representation behind openblas_complex_float / _double / _xdouble | |||||
and the matching openblas_make_complex_* constructor macros. | |||||
C99 supports complex floating-point numbers natively, and GCC has offered them | |||||
as an extension since version 3.0. If neither is available, use a compatible | |||||
structure as fallback (see section 6.2.5, paragraph 13 of the C99 standard). | |||||
Exactly one of OPENBLAS_COMPLEX_C99 or OPENBLAS_COMPLEX_STRUCT is defined here. */ | |||||
/* Native path: taken when __STDC_IEC_559_COMPLEX__ is defined, or
   __STDC_VERSION__ reports C99 or later, or __GNUC__ >= 3 in a non-C++
   translation unit. It is vetoed by FORCE_OPENBLAS_COMPLEX_STRUCT and by
   _MSC_VER, both of which force the struct fallback. */
#if ((defined(__STDC_IEC_559_COMPLEX__) || __STDC_VERSION__ >= 199901L || \ | |||||
(__GNUC__ >= 3 && !defined(__cplusplus))) && !(defined(FORCE_OPENBLAS_COMPLEX_STRUCT))) && !defined(_MSC_VER) | |||||
#define OPENBLAS_COMPLEX_C99 | |||||
/* <complex.h> is included for C translation units only; it provides the
   _Complex_I constant used by the constructor macros below.
   NOTE(review): a C++ translation unit that reaches this branch gets no
   declaration of _Complex_I from here - confirm the macros are never
   expanded in that configuration. */
#ifndef __cplusplus | |||||
#include <complex.h> | |||||
#endif | |||||
/* xdouble is not defined in this block - presumably an extended-precision
   typedef supplied by an earlier header; TODO confirm. */
typedef float _Complex openblas_complex_float; | |||||
typedef double _Complex openblas_complex_double; | |||||
typedef xdouble _Complex openblas_complex_xdouble; | |||||
/* Build a complex value arithmetically as real + imag*i. Each argument is
   parenthesized and expanded exactly once.
   NOTE(review): the arithmetic form may not carry an infinite or NaN
   imaginary part through exactly as the C11 CMPLX() macros would - confirm
   whether callers depend on that. */
#define openblas_make_complex_float(real, imag) ((real) + ((imag) * _Complex_I)) | |||||
#define openblas_make_complex_double(real, imag) ((real) + ((imag) * _Complex_I)) | |||||
#define openblas_make_complex_xdouble(real, imag) ((real) + ((imag) * _Complex_I)) | |||||
#else | |||||
/* Fallback path: plain structs with two members, real first and imag second. */
#define OPENBLAS_COMPLEX_STRUCT | |||||
typedef struct { float real, imag; } openblas_complex_float; | |||||
typedef struct { double real, imag; } openblas_complex_double; | |||||
typedef struct { xdouble real, imag; } openblas_complex_xdouble; | |||||
/* These expand to a brace-enclosed initializer list, not an expression, so
   they can only appear where an initializer is allowed (for example in a
   declaration), never as the right-hand side of a plain assignment. */
#define openblas_make_complex_float(real, imag) {(real), (imag)} | |||||
#define openblas_make_complex_double(real, imag) {(real), (imag)} | |||||
#define openblas_make_complex_xdouble(real, imag) {(real), (imag)} | |||||
#endif | |||||
#include "param.h" | #include "param.h" | ||||
#include "common_param.h" | #include "common_param.h" | ||||
@@ -524,31 +549,6 @@ static void __inline blas_lock(volatile BLASULONG *address){ | |||||
#include <stdio.h> | #include <stdio.h> | ||||
#endif // NOINCLUDE | #endif // NOINCLUDE | ||||
/* Choose how the openblas_complex_* types are represented. | |||||
C99 supports complex floating-point numbers natively, and GCC has offered them | |||||
as an extension since version 3.0. If neither is available, use a compatible | |||||
structure as fallback (see section 6.2.5, paragraph 13 of the C99 standard). */ | |||||
/* This condition contains no _MSC_VER test: any compiler that satisfies one of
   the three feature checks takes the native _Complex branch unless
   FORCE_OPENBLAS_COMPLEX_STRUCT is defined. */
#if ((defined(__STDC_IEC_559_COMPLEX__) || __STDC_VERSION__ >= 199901L || \ | |||||
(__GNUC__ >= 3 && !defined(__cplusplus))) && !(defined(FORCE_OPENBLAS_COMPLEX_STRUCT))) | |||||
#define OPENBLAS_COMPLEX_C99 | |||||
/* Only C translation units include <complex.h>, the header that declares
   _Complex_I. */
#ifndef __cplusplus | |||||
#include <complex.h> | |||||
#endif | |||||
/* Native complex typedefs. xdouble comes from outside this block -
   presumably an extended-precision type; TODO confirm. */
typedef float _Complex openblas_complex_float; | |||||
typedef double _Complex openblas_complex_double; | |||||
typedef xdouble _Complex openblas_complex_xdouble; | |||||
/* Constructors for the native types: the value is formed as
   real + imag * _Complex_I, with both arguments parenthesized. */
#define openblas_make_complex_float(real, imag) ((real) + ((imag) * _Complex_I)) | |||||
#define openblas_make_complex_double(real, imag) ((real) + ((imag) * _Complex_I)) | |||||
#define openblas_make_complex_xdouble(real, imag) ((real) + ((imag) * _Complex_I)) | |||||
#else | |||||
/* Struct fallback: two-member aggregates ordered real, then imag. */
#define OPENBLAS_COMPLEX_STRUCT | |||||
typedef struct { float real, imag; } openblas_complex_float; | |||||
typedef struct { double real, imag; } openblas_complex_double; | |||||
typedef struct { xdouble real, imag; } openblas_complex_xdouble; | |||||
/* Constructors for the struct types produce a braced initializer list, which
   is valid only in an initializer context, not in an assignment expression. */
#define openblas_make_complex_float(real, imag) {(real), (imag)} | |||||
#define openblas_make_complex_double(real, imag) {(real), (imag)} | |||||
#define openblas_make_complex_xdouble(real, imag) {(real), (imag)} | |||||
#endif | |||||
#ifdef XDOUBLE | #ifdef XDOUBLE | ||||
#define OPENBLAS_COMPLEX_FLOAT openblas_complex_xdouble | #define OPENBLAS_COMPLEX_FLOAT openblas_complex_xdouble | ||||
#define OPENBLAS_MAKE_COMPLEX_FLOAT(r,i) openblas_make_complex_xdouble(r,i) | #define OPENBLAS_MAKE_COMPLEX_FLOAT(r,i) openblas_make_complex_xdouble(r,i) | ||||
@@ -333,8 +333,8 @@ BLASLONG (*icamin_k)(BLASLONG, float *, BLASLONG); | |||||
float (*cnrm2_k) (BLASLONG, float *, BLASLONG); | float (*cnrm2_k) (BLASLONG, float *, BLASLONG); | ||||
float (*casum_k) (BLASLONG, float *, BLASLONG); | float (*casum_k) (BLASLONG, float *, BLASLONG); | ||||
int (*ccopy_k) (BLASLONG, float *, BLASLONG, float *, BLASLONG); | int (*ccopy_k) (BLASLONG, float *, BLASLONG, float *, BLASLONG); | ||||
float _Complex (*cdotu_k) (BLASLONG, float *, BLASLONG, float *, BLASLONG); | |||||
float _Complex (*cdotc_k) (BLASLONG, float *, BLASLONG, float *, BLASLONG); | |||||
openblas_complex_float (*cdotu_k) (BLASLONG, float *, BLASLONG, float *, BLASLONG); | |||||
openblas_complex_float (*cdotc_k) (BLASLONG, float *, BLASLONG, float *, BLASLONG); | |||||
int (*csrot_k) (BLASLONG, float *, BLASLONG, float *, BLASLONG, float, float); | int (*csrot_k) (BLASLONG, float *, BLASLONG, float *, BLASLONG, float, float); | ||||
int (*caxpy_k) (BLASLONG, BLASLONG, BLASLONG, float, float, float *, BLASLONG, float *, BLASLONG, float *, BLASLONG); | int (*caxpy_k) (BLASLONG, BLASLONG, BLASLONG, float, float, float *, BLASLONG, float *, BLASLONG, float *, BLASLONG); | ||||
@@ -496,8 +496,8 @@ BLASLONG (*izamin_k)(BLASLONG, double *, BLASLONG); | |||||
double (*znrm2_k) (BLASLONG, double *, BLASLONG); | double (*znrm2_k) (BLASLONG, double *, BLASLONG); | ||||
double (*zasum_k) (BLASLONG, double *, BLASLONG); | double (*zasum_k) (BLASLONG, double *, BLASLONG); | ||||
int (*zcopy_k) (BLASLONG, double *, BLASLONG, double *, BLASLONG); | int (*zcopy_k) (BLASLONG, double *, BLASLONG, double *, BLASLONG); | ||||
double _Complex (*zdotu_k) (BLASLONG, double *, BLASLONG, double *, BLASLONG); | |||||
double _Complex (*zdotc_k) (BLASLONG, double *, BLASLONG, double *, BLASLONG); | |||||
openblas_complex_double (*zdotu_k) (BLASLONG, double *, BLASLONG, double *, BLASLONG); | |||||
openblas_complex_double (*zdotc_k) (BLASLONG, double *, BLASLONG, double *, BLASLONG); | |||||
int (*zdrot_k) (BLASLONG, double *, BLASLONG, double *, BLASLONG, double, double); | int (*zdrot_k) (BLASLONG, double *, BLASLONG, double *, BLASLONG, double, double); | ||||
int (*zaxpy_k) (BLASLONG, BLASLONG, BLASLONG, double, double, double *, BLASLONG, double *, BLASLONG, double *, BLASLONG); | int (*zaxpy_k) (BLASLONG, BLASLONG, BLASLONG, double, double, double *, BLASLONG, double *, BLASLONG, double *, BLASLONG); | ||||
@@ -661,8 +661,8 @@ BLASLONG (*ixamin_k)(BLASLONG, xdouble *, BLASLONG); | |||||
xdouble (*xnrm2_k) (BLASLONG, xdouble *, BLASLONG); | xdouble (*xnrm2_k) (BLASLONG, xdouble *, BLASLONG); | ||||
xdouble (*xasum_k) (BLASLONG, xdouble *, BLASLONG); | xdouble (*xasum_k) (BLASLONG, xdouble *, BLASLONG); | ||||
int (*xcopy_k) (BLASLONG, xdouble *, BLASLONG, xdouble *, BLASLONG); | int (*xcopy_k) (BLASLONG, xdouble *, BLASLONG, xdouble *, BLASLONG); | ||||
xdouble _Complex (*xdotu_k) (BLASLONG, xdouble *, BLASLONG, xdouble *, BLASLONG); | |||||
xdouble _Complex (*xdotc_k) (BLASLONG, xdouble *, BLASLONG, xdouble *, BLASLONG); | |||||
openblas_complex_xdouble (*xdotu_k) (BLASLONG, xdouble *, BLASLONG, xdouble *, BLASLONG); | |||||
openblas_complex_xdouble (*xdotc_k) (BLASLONG, xdouble *, BLASLONG, xdouble *, BLASLONG); | |||||
int (*xqrot_k) (BLASLONG, xdouble *, BLASLONG, xdouble *, BLASLONG, xdouble, xdouble); | int (*xqrot_k) (BLASLONG, xdouble *, BLASLONG, xdouble *, BLASLONG, xdouble, xdouble); | ||||
int (*xaxpy_k) (BLASLONG, BLASLONG, BLASLONG, xdouble, xdouble, xdouble *, BLASLONG, xdouble *, BLASLONG, xdouble *, BLASLONG); | int (*xaxpy_k) (BLASLONG, BLASLONG, BLASLONG, xdouble, xdouble, xdouble *, BLASLONG, xdouble *, BLASLONG, xdouble *, BLASLONG); | ||||
@@ -91,16 +91,15 @@ static void cdot_kernel_16(BLASLONG n, FLOAT *x, FLOAT *y, FLOAT *d) | |||||
#endif | #endif | ||||
FLOAT _Complex CNAME(BLASLONG n, FLOAT *x, BLASLONG inc_x, FLOAT *y, BLASLONG inc_y) | |||||
OPENBLAS_COMPLEX_FLOAT CNAME(BLASLONG n, FLOAT *x, BLASLONG inc_x, FLOAT *y, BLASLONG inc_y) | |||||
{ | { | ||||
BLASLONG i; | BLASLONG i; | ||||
BLASLONG ix,iy; | BLASLONG ix,iy; | ||||
FLOAT _Complex result; | |||||
FLOAT dot[8] = { 0.0, 0.0, 0.0 , 0.0, 0.0, 0.0, 0.0, 0.0 } ; | FLOAT dot[8] = { 0.0, 0.0, 0.0 , 0.0, 0.0, 0.0, 0.0, 0.0 } ; | ||||
if ( n <= 0 ) | if ( n <= 0 ) | ||||
{ | { | ||||
result = OPENBLAS_MAKE_COMPLEX_FLOAT (0.0, 0.0) ; | |||||
OPENBLAS_COMPLEX_FLOAT result = OPENBLAS_MAKE_COMPLEX_FLOAT (0.0, 0.0) ; | |||||
return(result); | return(result); | ||||
} | } | ||||
@@ -160,11 +159,11 @@ FLOAT _Complex CNAME(BLASLONG n, FLOAT *x, BLASLONG inc_x, FLOAT *y, BLASLONG in | |||||
} | } | ||||
#if !defined(CONJ) | #if !defined(CONJ) | ||||
result = OPENBLAS_MAKE_COMPLEX_FLOAT (dot[0]-dot[1], dot[4]+dot[5]) ; | |||||
OPENBLAS_COMPLEX_FLOAT result = OPENBLAS_MAKE_COMPLEX_FLOAT (dot[0]-dot[1], dot[4]+dot[5]) ; | |||||
// CREAL(result) = dot[0] - dot[1]; | // CREAL(result) = dot[0] - dot[1]; | ||||
// CIMAG(result) = dot[4] + dot[5]; | // CIMAG(result) = dot[4] + dot[5]; | ||||
#else | #else | ||||
result = OPENBLAS_MAKE_COMPLEX_FLOAT (dot[0]+dot[1], dot[4]-dot[5]) ; | |||||
OPENBLAS_COMPLEX_FLOAT result = OPENBLAS_MAKE_COMPLEX_FLOAT (dot[0]+dot[1], dot[4]-dot[5]) ; | |||||
// CREAL(result) = dot[0] + dot[1]; | // CREAL(result) = dot[0] + dot[1]; | ||||
// CIMAG(result) = dot[4] - dot[5]; | // CIMAG(result) = dot[4] - dot[5]; | ||||
@@ -86,18 +86,17 @@ static void zdot_kernel_8(BLASLONG n, FLOAT *x, FLOAT *y, FLOAT *d) | |||||
#endif | #endif | ||||
FLOAT _Complex CNAME(BLASLONG n, FLOAT *x, BLASLONG inc_x, FLOAT *y, BLASLONG inc_y) | |||||
OPENBLAS_COMPLEX_FLOAT CNAME(BLASLONG n, FLOAT *x, BLASLONG inc_x, FLOAT *y, BLASLONG inc_y) | |||||
{ | { | ||||
BLASLONG i; | BLASLONG i; | ||||
BLASLONG ix,iy; | BLASLONG ix,iy; | ||||
FLOAT _Complex result; | |||||
FLOAT dot[4] = { 0.0, 0.0, 0.0 , 0.0 } ; | FLOAT dot[4] = { 0.0, 0.0, 0.0 , 0.0 } ; | ||||
if ( n <= 0 ) | if ( n <= 0 ) | ||||
{ | { | ||||
// CREAL(result) = 0.0 ; | // CREAL(result) = 0.0 ; | ||||
// CIMAG(result) = 0.0 ; | // CIMAG(result) = 0.0 ; | ||||
result=OPENBLAS_MAKE_COMPLEX_FLOAT(0.0,0.0); | |||||
OPENBLAS_COMPLEX_FLOAT result=OPENBLAS_MAKE_COMPLEX_FLOAT(0.0,0.0); | |||||
return(result); | return(result); | ||||
} | } | ||||
@@ -151,11 +150,11 @@ FLOAT _Complex CNAME(BLASLONG n, FLOAT *x, BLASLONG inc_x, FLOAT *y, BLASLONG in | |||||
} | } | ||||
#if !defined(CONJ) | #if !defined(CONJ) | ||||
result=OPENBLAS_MAKE_COMPLEX_FLOAT(dot[0]-dot[1],dot[2]+dot[3]); | |||||
OPENBLAS_COMPLEX_FLOAT result=OPENBLAS_MAKE_COMPLEX_FLOAT(dot[0]-dot[1],dot[2]+dot[3]); | |||||
// CREAL(result) = dot[0] - dot[1]; | // CREAL(result) = dot[0] - dot[1]; | ||||
// CIMAG(result) = dot[2] + dot[3]; | // CIMAG(result) = dot[2] + dot[3]; | ||||
#else | #else | ||||
result=OPENBLAS_MAKE_COMPLEX_FLOAT(dot[0]+dot[1],dot[2]-dot[3]); | |||||
OPENBLAS_COMPLEX_FLOAT result=OPENBLAS_MAKE_COMPLEX_FLOAT(dot[0]+dot[1],dot[2]-dot[3]); | |||||
// CREAL(result) = dot[0] + dot[1]; | // CREAL(result) = dot[0] + dot[1]; | ||||
// CIMAG(result) = dot[2] - dot[3]; | // CIMAG(result) = dot[2] - dot[3]; | ||||
@@ -59,7 +59,7 @@ typedef int blasint; | |||||
extension since version 3.0. If neither is available, use a compatible | extension since version 3.0. If neither is available, use a compatible | ||||
structure as fallback (see section 6.2.5, paragraph 13 of the C99 standard). */ | structure as fallback (see section 6.2.5, paragraph 13 of the C99 standard). */ | ||||
#if ((defined(__STDC_IEC_559_COMPLEX__) || __STDC_VERSION__ >= 199901L || \ | #if ((defined(__STDC_IEC_559_COMPLEX__) || __STDC_VERSION__ >= 199901L || \ | ||||
(__GNUC__ >= 3 && !defined(__cplusplus))) && !(defined(FORCE_OPENBLAS_COMPLEX_STRUCT))) | |||||
(__GNUC__ >= 3 && !defined(__cplusplus))) && !(defined(FORCE_OPENBLAS_COMPLEX_STRUCT))) && !defined(_MSC_VER) | |||||
#define OPENBLAS_COMPLEX_C99 | #define OPENBLAS_COMPLEX_C99 | ||||
#ifndef __cplusplus | #ifndef __cplusplus | ||||
#include <complex.h> | #include <complex.h> | ||||