This website works better with JavaScript.
Home
Issues
Pull Requests
Milestones
AI流水线
Repositories
Datasets
Forum
实训
竞赛
大数据
Register
Sign In
OSchip
/
OpenBLAS
Not watched
Unwatch
Watch all
Watch but not notify
1
Star
0
Fork
0
Code
Releases
66
Wiki
evaluate
Activity
Issues
0
Pull Requests
0
Datasets
Model
Cloudbrain
HPC
Browse Source
Fix declaration of arguments in inline assembly
Argument 0 is modified by the assembly code, so it must be declared as an input/output operand.
tags/v0.3.6^2
Martin Kroeker
GitHub
6 years ago
parent
b824fa70eb
commit
ab1630f9fa
No known key found for this signature in database
GPG Key ID:
4AEE18F83AFDEB23
8 changed files
with
18 additions
and
18 deletions
Split View
Diff Options
Show Stats
Download Patch File
Download Diff File
+2
-2
kernel/x86_64/dsymv_L_microk_bulldozer-2.c
+2
-2
kernel/x86_64/dsymv_L_microk_haswell-2.c
+2
-2
kernel/x86_64/dsymv_L_microk_nehalem-2.c
+2
-2
kernel/x86_64/dsymv_L_microk_sandy-2.c
+2
-2
kernel/x86_64/ssymv_L_microk_bulldozer-2.c
+2
-2
kernel/x86_64/ssymv_L_microk_haswell-2.c
+2
-2
kernel/x86_64/ssymv_L_microk_nehalem-2.c
+4
-4
kernel/x86_64/ssymv_L_microk_sandy-2.c
+ 2
- 2
kernel/x86_64/dsymv_L_microk_bulldozer-2.c
View File
@@ -113,8 +113,8 @@ static void dsymv_kernel_4x4(BLASLONG from, BLASLONG to, FLOAT **a, FLOAT *x, FL
"vmovsd %%xmm3 ,24(%9) \n\t" // save temp2
:
- :
- "r" (from), // 0
+ "+r" (from) // 0
+ :
"r" (to), // 1
"r" (x), // 2
"r" (y), // 3
+ 2
- 2
kernel/x86_64/dsymv_L_microk_haswell-2.c
View File
@@ -105,8 +105,8 @@ static void dsymv_kernel_4x4(BLASLONG from, BLASLONG to, FLOAT **a, FLOAT *x, FL
"vzeroupper \n\t"
:
- :
- "r" (from), // 0
+ "+r" (from) // 0
+ :
"r" (to), // 1
"r" (x), // 2
"r" (y), // 3
+ 2
- 2
kernel/x86_64/dsymv_L_microk_nehalem-2.c
View File
@@ -108,8 +108,8 @@ static void dsymv_kernel_4x4(BLASLONG from, BLASLONG to, FLOAT **a, FLOAT *x, FL
"movsd %%xmm3 , 24(%9) \n\t" // save temp2
:
- :
- "r" (from), // 0
+ "+r" (from) // 0
+ :
"r" (to), // 1
"r" (x), // 2
"r" (y), // 3
+ 2
- 2
kernel/x86_64/dsymv_L_microk_sandy-2.c
View File
@@ -114,8 +114,8 @@ static void dsymv_kernel_4x4(BLASLONG from, BLASLONG to, FLOAT **a, FLOAT *x, FL
"vzeroupper \n\t"
:
- :
- "r" (from), // 0
+ "+r" (from) // 0
+ :
"r" (to), // 1
"r" (x), // 2
"r" (y), // 3
+ 2
- 2
kernel/x86_64/ssymv_L_microk_bulldozer-2.c
View File
@@ -98,8 +98,8 @@ static void ssymv_kernel_4x4(BLASLONG from, BLASLONG to, FLOAT **a, FLOAT *x, FL
"vmovss %%xmm3 ,12(%9) \n\t" // save temp2
:
- :
- "r" (from), // 0
+ "+r" (from) // 0
+ :
"r" (to), // 1
"r" (x), // 2
"r" (y), // 3
+ 2
- 2
kernel/x86_64/ssymv_L_microk_haswell-2.c
View File
@@ -99,8 +99,8 @@ static void ssymv_kernel_4x4(BLASLONG from, BLASLONG to, FLOAT **a, FLOAT *x, FL
"vzeroupper \n\t"
:
- :
- "r" (from), // 0
+ "+r" (from) // 0
+ :
"r" (to), // 1
"r" (x), // 2
"r" (y), // 3
+ 2
- 2
kernel/x86_64/ssymv_L_microk_nehalem-2.c
View File
@@ -113,8 +113,8 @@ static void ssymv_kernel_4x4(BLASLONG from, BLASLONG to, FLOAT **a, FLOAT *x, F
"movss %%xmm3 , 12(%9) \n\t" // save temp2
:
- :
- "r" (from), // 0
+ "+r" (from) // 0
+ :
"r" (to), // 1
"r" (x), // 2
"r" (y), // 3
+ 4
- 4
kernel/x86_64/ssymv_L_microk_sandy-2.c
View File
@@ -109,8 +109,8 @@ static void ssymv_kernel_4x4(BLASLONG from, BLASLONG to, FLOAT **a, FLOAT *x, FL
"vzeroupper \n\t"
:
- :
- "r" (from), // 0
+ "+r" (from) // 0
+ :
"r" (to), // 1
"r" (x), // 2
"r" (y), // 3
@@ -217,8 +217,8 @@ static void ssymv_kernel_4x4(BLASLONG from, BLASLONG to, FLOAT **a, FLOAT *x, FL
"vzeroupper \n\t"
:
- :
- "r" (from), // 0
+ "+r" (from) // 0
+ :
"r" (to), // 1
"r" (x), // 2
"r" (y), // 3
Write
Preview
Loading…
Cancel
Save