We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
2 parents 8e20ab2 + b073d75 commit ee83e29Copy full SHA for ee83e29
22 files changed
kernel/x86_64/caxpy_microk_bulldozer-2.c
@@ -122,7 +122,7 @@ static void caxpy_kernel_8( BLASLONG n, FLOAT *x, FLOAT *y, FLOAT *alpha)
122
"r" (alpha), // 4
123
"r" (mvec) // 5
124
: "cc",
125
- "%xmm0", "%xmm1",
+ "%xmm0", "%xmm1", "%xmm2", "%xmm3",
126
"%xmm4", "%xmm5", "%xmm6", "%xmm7",
127
"%xmm8", "%xmm9", "%xmm10", "%xmm11",
128
"%xmm12", "%xmm13", "%xmm14", "%xmm15",
@@ -189,9 +189,10 @@ static void caxpy_kernel_8( BLASLONG n, FLOAT *x, FLOAT *y, FLOAT *alpha)
189
190
191
192
193
194
195
+ "%xmm12", "%xmm13", "%xmm14", "%xmm15",
196
"memory"
197
);
198
kernel/x86_64/caxpy_microk_haswell-2.c
@@ -120,7 +120,7 @@ static void caxpy_kernel_8( BLASLONG n, FLOAT *x, FLOAT *y, FLOAT *alpha)
120
121
kernel/x86_64/caxpy_microk_sandy-2.c
@@ -104,7 +104,7 @@ static void caxpy_kernel_8( BLASLONG n, FLOAT *x, FLOAT *y, FLOAT *alpha)
104
105
106
107
108
109
110
kernel/x86_64/caxpy_microk_steamroller-2.c
kernel/x86_64/daxpy_microk_haswell-2.c
@@ -67,8 +67,9 @@ static void daxpy_kernel_8( BLASLONG n, FLOAT *x, FLOAT *y, FLOAT *alpha)
67
"r" (y), // 3
68
"r" (alpha) // 4
69
70
- "%xmm0",
71
- "%xmm8", "%xmm9", "%xmm10", "%xmm11",
+ "%xmm4", "%xmm5", "%xmm6", "%xmm7",
72
+ "%xmm8", "%xmm9", "%xmm10", "%xmm11",
73
74
75
kernel/x86_64/ddot_microk_haswell-2.c
@@ -84,8 +84,9 @@ static void ddot_kernel_8( BLASLONG n, FLOAT *x, FLOAT *y, FLOAT *dot)
84
85
"r" (dot) // 4
86
87
- "%xmm4", "%xmm5",
88
- "%xmm6", "%xmm7",
89
90
91
92
kernel/x86_64/ddot_microk_piledriver-2.c
@@ -91,6 +91,7 @@ static void ddot_kernel_8( BLASLONG n, FLOAT *x, FLOAT *y, FLOAT *dot)
"%xmm0", "%xmm1", "%xmm2", "%xmm3",
93
94
95
96
97
@@ -155,6 +156,7 @@ static void ddot_kernel_8( BLASLONG n, FLOAT *x, FLOAT *y, FLOAT *dot)
155
156
157
158
159
160
161
162
kernel/x86_64/ddot_microk_sandy-2.c
@@ -89,8 +89,9 @@ static void ddot_kernel_8( BLASLONG n, FLOAT *x, FLOAT *y, FLOAT *dot)
kernel/x86_64/ddot_microk_steamroller-2.c
@@ -88,6 +88,7 @@ static void ddot_kernel_8( BLASLONG n, FLOAT *x, FLOAT *y, FLOAT *dot)
kernel/x86_64/dgemv_n_microk_haswell-4.c
@@ -105,9 +105,8 @@ static void dgemv_kernel_4x4( BLASLONG n, FLOAT **ap, FLOAT *x, FLOAT *y, FLOAT
"r" (alpha) // 8
- "%xmm8", "%xmm9",
111
112
113
@@ -182,11 +181,10 @@ static void dgemv_kernel_4x2( BLASLONG n, FLOAT **ap, FLOAT *x, FLOAT *y, FLOAT
182
181
"r" (ap[1]), // 5
183
"r" (alpha) // 6
184
185
186
187
- "%xmm6",
188
- "%xmm8",
- "%xmm12", "%xmm13",
}
0 commit comments