/root/doris/contrib/openblas/common_s.h
Line | Count | Source |
1 | | #ifndef COMMON_S_H |
2 | | #define COMMON_S_H |
3 | | /* Maps upper-case S* macro names to lower-case symbols. The first part has two variants chosen by DYNAMIC_ARCH; the rest of the header is unconditional. */ |
4 | | #ifndef DYNAMIC_ARCH |
5 | | /* DYNAMIC_ARCH not defined: every macro in this branch expands to a bare identifier. */ |
6 | | #define SAMAX_K samax_k |
7 | 0 | #define SAMIN_K samin_k |
8 | | #define SMAX_K smax_k |
9 | | #define SMIN_K smin_k |
10 | 0 | #define ISAMAX_K isamax_k |
11 | 0 | #define ISAMIN_K isamin_k |
12 | | #define ISMAX_K ismax_k |
13 | | #define ISMIN_K ismin_k |
14 | | #define SASUM_K sasum_k |
15 | | #define SSUM_K ssum_k |
16 | 0 | #define SAXPYU_K saxpy_k |
17 | | #define SAXPYC_K saxpy_k /* same target as SAXPYU_K */ |
18 | 0 | #define SCOPY_K scopy_k |
19 | 0 | #define SDOTU_K sdot_k |
20 | | #define SDOTC_K sdot_k /* same target as SDOTU_K */ |
21 | | #define SDSDOT_K dsdot_k /* SDSDOT_K and DSDOT_K share one target */ |
22 | | #define DSDOT_K dsdot_k |
23 | 0 | #define SNRM2_K snrm2_k |
24 | 0 | #define SSCAL_K sscal_k |
25 | 0 | #define SSWAP_K sswap_k |
26 | 0 | #define SROT_K srot_k |
27 | | #define SROTM_K srotm_k |
28 | | /* The eight SGEMV_* names resolve to only two targets: sgemv_n (N, R, O, S) and sgemv_t (T, C, U, D). */ |
29 | 0 | #define SGEMV_N sgemv_n |
30 | 0 | #define SGEMV_T sgemv_t |
31 | | #define SGEMV_R sgemv_n |
32 | | #define SGEMV_C sgemv_t |
33 | | #define SGEMV_O sgemv_n |
34 | | #define SGEMV_U sgemv_t |
35 | | #define SGEMV_S sgemv_n |
36 | | #define SGEMV_D sgemv_t |
37 | | /* All four SGER*_K names resolve to the single target sger_k. */ |
38 | 0 | #define SGERU_K sger_k |
39 | | #define SGERC_K sger_k |
40 | | #define SGERV_K sger_k |
41 | | #define SGERD_K sger_k |
42 | | /* SSYMV targets, one per U/L suffix, followed by their _thread_ counterparts. */ |
43 | | #define SSYMV_U ssymv_U |
44 | | #define SSYMV_L ssymv_L |
45 | | |
46 | | #define SSYMV_THREAD_U ssymv_thread_U |
47 | | #define SSYMV_THREAD_L ssymv_thread_L |
48 | | |
49 | | /* In this branch both SGEMM_DIRECT macros are defined unconditionally, with no architecture test. */ |
50 | | #define SGEMM_DIRECT_PERFORMANT sgemm_direct_performant |
51 | | #define SGEMM_DIRECT sgemm_direct |
52 | | /* SGEMM_*COPY macros: the I-variants reuse the O-variant targets when SGEMM_DEFAULT_UNROLL_M == SGEMM_DEFAULT_UNROLL_N. */ |
53 | 0 | #define SGEMM_ONCOPY sgemm_oncopy |
54 | 0 | #define SGEMM_OTCOPY sgemm_otcopy |
55 | | |
56 | | #if SGEMM_DEFAULT_UNROLL_M == SGEMM_DEFAULT_UNROLL_N |
57 | | #define SGEMM_INCOPY sgemm_oncopy |
58 | | #define SGEMM_ITCOPY sgemm_otcopy |
59 | | #else |
60 | 0 | #define SGEMM_INCOPY sgemm_incopy |
61 | 0 | #define SGEMM_ITCOPY sgemm_itcopy |
62 | | #endif |
63 | | /* STRMM/STRSM O*COPY macros: each maps to the identically spelled lower-case name. */ |
64 | 0 | #define STRMM_OUNUCOPY strmm_ounucopy |
65 | 0 | #define STRMM_OUNNCOPY strmm_ounncopy |
66 | 0 | #define STRMM_OUTUCOPY strmm_outucopy |
67 | 0 | #define STRMM_OUTNCOPY strmm_outncopy |
68 | 0 | #define STRMM_OLNUCOPY strmm_olnucopy |
69 | 0 | #define STRMM_OLNNCOPY strmm_olnncopy |
70 | 0 | #define STRMM_OLTUCOPY strmm_oltucopy |
71 | 0 | #define STRMM_OLTNCOPY strmm_oltncopy |
72 | | |
73 | 0 | #define STRSM_OUNUCOPY strsm_ounucopy |
74 | 0 | #define STRSM_OUNNCOPY strsm_ounncopy |
75 | 0 | #define STRSM_OUTUCOPY strsm_outucopy |
76 | 0 | #define STRSM_OUTNCOPY strsm_outncopy |
77 | 0 | #define STRSM_OLNUCOPY strsm_olnucopy |
78 | 0 | #define STRSM_OLNNCOPY strsm_olnncopy |
79 | 0 | #define STRSM_OLTUCOPY strsm_oltucopy |
80 | 0 | #define STRSM_OLTNCOPY strsm_oltncopy |
81 | | /* STRMM/STRSM I*COPY macros: alias the o* targets when SGEMM_DEFAULT_UNROLL_M == SGEMM_DEFAULT_UNROLL_N, otherwise map to separate i* targets. */ |
82 | | #if SGEMM_DEFAULT_UNROLL_M == SGEMM_DEFAULT_UNROLL_N |
83 | | #define STRMM_IUNUCOPY strmm_ounucopy |
84 | | #define STRMM_IUNNCOPY strmm_ounncopy |
85 | | #define STRMM_IUTUCOPY strmm_outucopy |
86 | | #define STRMM_IUTNCOPY strmm_outncopy |
87 | | #define STRMM_ILNUCOPY strmm_olnucopy |
88 | | #define STRMM_ILNNCOPY strmm_olnncopy |
89 | | #define STRMM_ILTUCOPY strmm_oltucopy |
90 | | #define STRMM_ILTNCOPY strmm_oltncopy |
91 | | |
92 | | #define STRSM_IUNUCOPY strsm_ounucopy |
93 | | #define STRSM_IUNNCOPY strsm_ounncopy |
94 | | #define STRSM_IUTUCOPY strsm_outucopy |
95 | | #define STRSM_IUTNCOPY strsm_outncopy |
96 | | #define STRSM_ILNUCOPY strsm_olnucopy |
97 | | #define STRSM_ILNNCOPY strsm_olnncopy |
98 | | #define STRSM_ILTUCOPY strsm_oltucopy |
99 | | #define STRSM_ILTNCOPY strsm_oltncopy |
100 | | #else |
101 | 0 | #define STRMM_IUNUCOPY strmm_iunucopy |
102 | 0 | #define STRMM_IUNNCOPY strmm_iunncopy |
103 | 0 | #define STRMM_IUTUCOPY strmm_iutucopy |
104 | 0 | #define STRMM_IUTNCOPY strmm_iutncopy |
105 | 0 | #define STRMM_ILNUCOPY strmm_ilnucopy |
106 | 0 | #define STRMM_ILNNCOPY strmm_ilnncopy |
107 | 0 | #define STRMM_ILTUCOPY strmm_iltucopy |
108 | 0 | #define STRMM_ILTNCOPY strmm_iltncopy |
109 | | |
110 | 0 | #define STRSM_IUNUCOPY strsm_iunucopy |
111 | 0 | #define STRSM_IUNNCOPY strsm_iunncopy |
112 | 0 | #define STRSM_IUTUCOPY strsm_iutucopy |
113 | 0 | #define STRSM_IUTNCOPY strsm_iutncopy |
114 | 0 | #define STRSM_ILNUCOPY strsm_ilnucopy |
115 | 0 | #define STRSM_ILNNCOPY strsm_ilnncopy |
116 | 0 | #define STRSM_ILTUCOPY strsm_iltucopy |
117 | 0 | #define STRSM_ILTNCOPY strsm_iltncopy |
118 | | #endif |
119 | | /* One-to-one mappings for SGEMM_BETA and SGEMM_KERNEL. */ |
120 | 0 | #define SGEMM_BETA sgemm_beta |
121 | | |
122 | 0 | #define SGEMM_KERNEL sgemm_kernel |
123 | | /* STRMM/STRSM kernel macros: the R and C suffixes reuse the N and T targets (LR to LN, LC to LT, RR to RN, RC to RT). */ |
124 | 0 | #define STRMM_KERNEL_LN strmm_kernel_LN |
125 | 0 | #define STRMM_KERNEL_LT strmm_kernel_LT |
126 | | #define STRMM_KERNEL_LR strmm_kernel_LN |
127 | | #define STRMM_KERNEL_LC strmm_kernel_LT |
128 | 0 | #define STRMM_KERNEL_RN strmm_kernel_RN |
129 | 0 | #define STRMM_KERNEL_RT strmm_kernel_RT |
130 | | #define STRMM_KERNEL_RR strmm_kernel_RN |
131 | | #define STRMM_KERNEL_RC strmm_kernel_RT |
132 | | |
133 | 0 | #define STRSM_KERNEL_LN strsm_kernel_LN |
134 | 0 | #define STRSM_KERNEL_LT strsm_kernel_LT |
135 | | #define STRSM_KERNEL_LR strsm_kernel_LN |
136 | | #define STRSM_KERNEL_LC strsm_kernel_LT |
137 | 0 | #define STRSM_KERNEL_RN strsm_kernel_RN |
138 | 0 | #define STRSM_KERNEL_RT strsm_kernel_RT |
139 | | #define STRSM_KERNEL_RR strsm_kernel_RN |
140 | | #define STRSM_KERNEL_RC strsm_kernel_RT |
141 | | /* SSYMM copy macros: the I-variants alias the O-variant targets when SGEMM_DEFAULT_UNROLL_M == SGEMM_DEFAULT_UNROLL_N. */ |
142 | | #define SSYMM_OUTCOPY ssymm_outcopy |
143 | | #define SSYMM_OLTCOPY ssymm_oltcopy |
144 | | #if SGEMM_DEFAULT_UNROLL_M == SGEMM_DEFAULT_UNROLL_N |
145 | | #define SSYMM_IUTCOPY ssymm_outcopy |
146 | | #define SSYMM_ILTCOPY ssymm_oltcopy |
147 | | #else |
148 | | #define SSYMM_IUTCOPY ssymm_iutcopy |
149 | | #define SSYMM_ILTCOPY ssymm_iltcopy |
150 | | #endif |
151 | | /* Remaining one-to-one mappings of the static branch: SNEG_TCOPY, SLASWP_NCOPY, SAXPBY_K, S[OI]MATCOPY_K_*, SGEADD_K, SGEMM_SMALL_MATRIX_PERMIT. */ |
152 | | #define SNEG_TCOPY sneg_tcopy |
153 | | #define SLASWP_NCOPY slaswp_ncopy |
154 | | |
155 | | #define SAXPBY_K saxpby_k |
156 | | |
157 | | #define SOMATCOPY_K_CN somatcopy_k_cn |
158 | | #define SOMATCOPY_K_RN somatcopy_k_rn |
159 | | #define SOMATCOPY_K_CT somatcopy_k_ct |
160 | | #define SOMATCOPY_K_RT somatcopy_k_rt |
161 | | #define SIMATCOPY_K_CN simatcopy_k_cn |
162 | | #define SIMATCOPY_K_RN simatcopy_k_rn |
163 | | #define SIMATCOPY_K_CT simatcopy_k_ct |
164 | | #define SIMATCOPY_K_RT simatcopy_k_rt |
165 | | |
166 | | #define SGEADD_K sgeadd_k |
167 | | |
168 | 0 | #define SGEMM_SMALL_MATRIX_PERMIT sgemm_small_matrix_permit |
169 | | |
170 | | #else |
171 | | /* DYNAMIC_ARCH defined: macros expand to members reached through gotoblas, which is not declared in this header. */ |
172 | | #define SAMAX_K gotoblas -> samax_k |
173 | | #define SAMIN_K gotoblas -> samin_k |
174 | | #define SMAX_K gotoblas -> smax_k |
175 | | #define SMIN_K gotoblas -> smin_k |
176 | | #define ISAMAX_K gotoblas -> isamax_k |
177 | | #define ISAMIN_K gotoblas -> isamin_k |
178 | | #define ISMAX_K gotoblas -> ismax_k |
179 | | #define ISMIN_K gotoblas -> ismin_k |
180 | | #define SASUM_K gotoblas -> sasum_k |
181 | | #define SSUM_K gotoblas -> ssum_k |
182 | | #define SAXPYU_K gotoblas -> saxpy_k |
183 | | #define SAXPYC_K gotoblas -> saxpy_k /* same member as SAXPYU_K */ |
184 | | #define SCOPY_K gotoblas -> scopy_k |
185 | | #define SDOTU_K gotoblas -> sdot_k |
186 | | #define SDOTC_K gotoblas -> sdot_k /* same member as SDOTU_K */ |
187 | | #define SDSDOT_K gotoblas -> dsdot_k /* SDSDOT_K and DSDOT_K share one member */ |
188 | | #define DSDOT_K gotoblas -> dsdot_k |
189 | | #define SNRM2_K gotoblas -> snrm2_k |
190 | | #define SSCAL_K gotoblas -> sscal_k |
191 | | #define SSWAP_K gotoblas -> sswap_k |
192 | | #define SROT_K gotoblas -> srot_k |
193 | | #define SROTM_K gotoblas -> srotm_k |
194 | | /* As in the static branch, the eight SGEMV_* names use only two members: sgemv_n and sgemv_t. */ |
195 | | #define SGEMV_N gotoblas -> sgemv_n |
196 | | #define SGEMV_T gotoblas -> sgemv_t |
197 | | #define SGEMV_R gotoblas -> sgemv_n |
198 | | #define SGEMV_C gotoblas -> sgemv_t |
199 | | #define SGEMV_O gotoblas -> sgemv_n |
200 | | #define SGEMV_U gotoblas -> sgemv_t |
201 | | #define SGEMV_S gotoblas -> sgemv_n |
202 | | #define SGEMV_D gotoblas -> sgemv_t |
203 | | /* All four SGER*_K names use the single member sger_k. */ |
204 | | #define SGERU_K gotoblas -> sger_k |
205 | | #define SGERC_K gotoblas -> sger_k |
206 | | #define SGERV_K gotoblas -> sger_k |
207 | | #define SGERD_K gotoblas -> sger_k |
208 | | /* SSYMV_U and SSYMV_L go through gotoblas; the SSYMV_THREAD_* names stay plain symbols even in this branch. */ |
209 | | #define SSYMV_U gotoblas -> ssymv_U |
210 | | #define SSYMV_L gotoblas -> ssymv_L |
211 | | |
212 | | #define SSYMV_THREAD_U ssymv_thread_U |
213 | | #define SSYMV_THREAD_L ssymv_thread_L |
214 | | |
215 | | #ifdef ARCH_X86_64 |
216 | | #define SGEMM_DIRECT_PERFORMANT gotoblas -> sgemm_direct_performant |
217 | | #define SGEMM_DIRECT gotoblas -> sgemm_direct |
218 | | #elif ARCH_ARM64 |
219 | | #define SGEMM_DIRECT_PERFORMANT sgemm_direct_performant |
220 | | #define SGEMM_DIRECT gotoblas -> sgemm_direct |
221 | | #endif |
222 | | /* Unlike the static branch, SGEMM_INCOPY and SGEMM_ITCOPY always map to their own members here; there is no unroll-factor test. */ |
223 | | #define SGEMM_ONCOPY gotoblas -> sgemm_oncopy |
224 | | #define SGEMM_OTCOPY gotoblas -> sgemm_otcopy |
225 | | #define SGEMM_INCOPY gotoblas -> sgemm_incopy |
226 | | #define SGEMM_ITCOPY gotoblas -> sgemm_itcopy |
227 | | /* STRMM/STRSM copy members, listed in four groups by name: O*UCOPY, I*UCOPY, O*NCOPY, I*NCOPY. Each macro has its own member. */ |
228 | | #define STRMM_OUNUCOPY gotoblas -> strmm_ounucopy |
229 | | #define STRMM_OUTUCOPY gotoblas -> strmm_outucopy |
230 | | #define STRMM_OLNUCOPY gotoblas -> strmm_olnucopy |
231 | | #define STRMM_OLTUCOPY gotoblas -> strmm_oltucopy |
232 | | #define STRSM_OUNUCOPY gotoblas -> strsm_ounucopy |
233 | | #define STRSM_OUTUCOPY gotoblas -> strsm_outucopy |
234 | | #define STRSM_OLNUCOPY gotoblas -> strsm_olnucopy |
235 | | #define STRSM_OLTUCOPY gotoblas -> strsm_oltucopy |
236 | | |
237 | | #define STRMM_IUNUCOPY gotoblas -> strmm_iunucopy |
238 | | #define STRMM_IUTUCOPY gotoblas -> strmm_iutucopy |
239 | | #define STRMM_ILNUCOPY gotoblas -> strmm_ilnucopy |
240 | | #define STRMM_ILTUCOPY gotoblas -> strmm_iltucopy |
241 | | #define STRSM_IUNUCOPY gotoblas -> strsm_iunucopy |
242 | | #define STRSM_IUTUCOPY gotoblas -> strsm_iutucopy |
243 | | #define STRSM_ILNUCOPY gotoblas -> strsm_ilnucopy |
244 | | #define STRSM_ILTUCOPY gotoblas -> strsm_iltucopy |
245 | | |
246 | | #define STRMM_OUNNCOPY gotoblas -> strmm_ounncopy |
247 | | #define STRMM_OUTNCOPY gotoblas -> strmm_outncopy |
248 | | #define STRMM_OLNNCOPY gotoblas -> strmm_olnncopy |
249 | | #define STRMM_OLTNCOPY gotoblas -> strmm_oltncopy |
250 | | #define STRSM_OUNNCOPY gotoblas -> strsm_ounncopy |
251 | | #define STRSM_OUTNCOPY gotoblas -> strsm_outncopy |
252 | | #define STRSM_OLNNCOPY gotoblas -> strsm_olnncopy |
253 | | #define STRSM_OLTNCOPY gotoblas -> strsm_oltncopy |
254 | | |
255 | | #define STRMM_IUNNCOPY gotoblas -> strmm_iunncopy |
256 | | #define STRMM_IUTNCOPY gotoblas -> strmm_iutncopy |
257 | | #define STRMM_ILNNCOPY gotoblas -> strmm_ilnncopy |
258 | | #define STRMM_ILTNCOPY gotoblas -> strmm_iltncopy |
259 | | #define STRSM_IUNNCOPY gotoblas -> strsm_iunncopy |
260 | | #define STRSM_IUTNCOPY gotoblas -> strsm_iutncopy |
261 | | #define STRSM_ILNNCOPY gotoblas -> strsm_ilnncopy |
262 | | #define STRSM_ILTNCOPY gotoblas -> strsm_iltncopy |
263 | | /* One-to-one member mappings for SGEMM_BETA and SGEMM_KERNEL. */ |
264 | | #define SGEMM_BETA gotoblas -> sgemm_beta |
265 | | #define SGEMM_KERNEL gotoblas -> sgemm_kernel |
266 | | /* STRMM/STRSM kernel members: the R and C suffixes reuse the N and T members (LR to LN, LC to LT, RR to RN, RC to RT). */ |
267 | | #define STRMM_KERNEL_LN gotoblas -> strmm_kernel_LN |
268 | | #define STRMM_KERNEL_LT gotoblas -> strmm_kernel_LT |
269 | | #define STRMM_KERNEL_LR gotoblas -> strmm_kernel_LN |
270 | | #define STRMM_KERNEL_LC gotoblas -> strmm_kernel_LT |
271 | | #define STRMM_KERNEL_RN gotoblas -> strmm_kernel_RN |
272 | | #define STRMM_KERNEL_RT gotoblas -> strmm_kernel_RT |
273 | | #define STRMM_KERNEL_RR gotoblas -> strmm_kernel_RN |
274 | | #define STRMM_KERNEL_RC gotoblas -> strmm_kernel_RT |
275 | | |
276 | | #define STRSM_KERNEL_LN gotoblas -> strsm_kernel_LN |
277 | | #define STRSM_KERNEL_LT gotoblas -> strsm_kernel_LT |
278 | | #define STRSM_KERNEL_LR gotoblas -> strsm_kernel_LN |
279 | | #define STRSM_KERNEL_LC gotoblas -> strsm_kernel_LT |
280 | | #define STRSM_KERNEL_RN gotoblas -> strsm_kernel_RN |
281 | | #define STRSM_KERNEL_RT gotoblas -> strsm_kernel_RT |
282 | | #define STRSM_KERNEL_RR gotoblas -> strsm_kernel_RN |
283 | | #define STRSM_KERNEL_RC gotoblas -> strsm_kernel_RT |
284 | | /* SSYMM copy members: the I- and O-variants each have their own member in this branch. */ |
285 | | #define SSYMM_IUTCOPY gotoblas -> ssymm_iutcopy |
286 | | #define SSYMM_ILTCOPY gotoblas -> ssymm_iltcopy |
287 | | #define SSYMM_OUTCOPY gotoblas -> ssymm_outcopy |
288 | | #define SSYMM_OLTCOPY gotoblas -> ssymm_oltcopy |
289 | | /* Remaining one-to-one member mappings of the dynamic branch, mirroring the tail of the static branch. */ |
290 | | #define SNEG_TCOPY gotoblas -> sneg_tcopy |
291 | | #define SLASWP_NCOPY gotoblas -> slaswp_ncopy |
292 | | |
293 | | #define SAXPBY_K gotoblas -> saxpby_k |
294 | | |
295 | | #define SOMATCOPY_K_CN gotoblas -> somatcopy_k_cn |
296 | | #define SOMATCOPY_K_RN gotoblas -> somatcopy_k_rn |
297 | | #define SOMATCOPY_K_CT gotoblas -> somatcopy_k_ct |
298 | | #define SOMATCOPY_K_RT gotoblas -> somatcopy_k_rt |
299 | | #define SIMATCOPY_K_CN gotoblas -> simatcopy_k_cn |
300 | | #define SIMATCOPY_K_RN gotoblas -> simatcopy_k_rn |
301 | | #define SIMATCOPY_K_CT gotoblas -> simatcopy_k_ct |
302 | | #define SIMATCOPY_K_RT gotoblas -> simatcopy_k_rt |
303 | | |
304 | | #define SGEADD_K gotoblas -> sgeadd_k |
305 | | |
306 | | #define SGEMM_SMALL_MATRIX_PERMIT gotoblas -> sgemm_small_matrix_permit |
307 | | |
308 | | #endif /* DYNAMIC_ARCH */ |
309 | | /* From here on the mappings are unconditional. The small-kernel names are wrapped in FUNC_OFFSET(), which is not defined in this header. */ |
310 | | #define SGEMM_SMALL_KERNEL_NN FUNC_OFFSET(sgemm_small_kernel_nn) |
311 | | #define SGEMM_SMALL_KERNEL_NT FUNC_OFFSET(sgemm_small_kernel_nt) |
312 | | #define SGEMM_SMALL_KERNEL_TN FUNC_OFFSET(sgemm_small_kernel_tn) |
313 | | #define SGEMM_SMALL_KERNEL_TT FUNC_OFFSET(sgemm_small_kernel_tt) |
314 | | |
315 | | #define SGEMM_SMALL_KERNEL_B0_NN FUNC_OFFSET(sgemm_small_kernel_b0_nn) |
316 | | #define SGEMM_SMALL_KERNEL_B0_NT FUNC_OFFSET(sgemm_small_kernel_b0_nt) |
317 | | #define SGEMM_SMALL_KERNEL_B0_TN FUNC_OFFSET(sgemm_small_kernel_b0_tn) |
318 | | #define SGEMM_SMALL_KERNEL_B0_TT FUNC_OFFSET(sgemm_small_kernel_b0_tt) |
319 | | |
320 | | /* Sixteen SGEMM_xy names collapse onto four targets: a letter R maps like N and a letter C maps like T. */ |
321 | 0 | #define SGEMM_NN sgemm_nn |
322 | | #define SGEMM_CN sgemm_tn |
323 | 0 | #define SGEMM_TN sgemm_tn |
324 | | #define SGEMM_NC sgemm_nt |
325 | 0 | #define SGEMM_NT sgemm_nt |
326 | | #define SGEMM_CC sgemm_tt |
327 | | #define SGEMM_CT sgemm_tt |
328 | | #define SGEMM_TC sgemm_tt |
329 | 0 | #define SGEMM_TT sgemm_tt |
330 | | #define SGEMM_NR sgemm_nn |
331 | | #define SGEMM_TR sgemm_tn |
332 | | #define SGEMM_CR sgemm_tn |
333 | | #define SGEMM_RN sgemm_nn |
334 | | #define SGEMM_RT sgemm_nt |
335 | | #define SGEMM_RC sgemm_nt |
336 | | #define SGEMM_RR sgemm_nn |
337 | | /* SSYMM_* and SHEMM_* each map to their own like-named targets; SHEMM is not aliased to SSYMM here. */ |
338 | | #define SSYMM_LU ssymm_LU |
339 | | #define SSYMM_LL ssymm_LL |
340 | | #define SSYMM_RU ssymm_RU |
341 | | #define SSYMM_RL ssymm_RL |
342 | | |
343 | | #define SHEMM_LU shemm_LU |
344 | | #define SHEMM_LL shemm_LL |
345 | | #define SHEMM_RU shemm_RU |
346 | | #define SHEMM_RL shemm_RL |
347 | | /* SSYRK: the UR and LR names reuse the UN and LN targets, and UC and LC reuse UT and LT. The two SSYRK_KERNEL names follow. */ |
348 | 0 | #define SSYRK_UN ssyrk_UN |
349 | 0 | #define SSYRK_UT ssyrk_UT |
350 | 0 | #define SSYRK_LN ssyrk_LN |
351 | 0 | #define SSYRK_LT ssyrk_LT |
352 | | #define SSYRK_UR ssyrk_UN |
353 | | #define SSYRK_UC ssyrk_UT |
354 | | #define SSYRK_LR ssyrk_LN |
355 | | #define SSYRK_LC ssyrk_LT |
356 | | |
357 | 0 | #define SSYRK_KERNEL_U ssyrk_kernel_U |
358 | 0 | #define SSYRK_KERNEL_L ssyrk_kernel_L |
359 | | /* SHERK_* and SHER2K_* are pure aliases of the ssyrk_* and ssyr2k_* targets; the C suffix maps to the T target. */ |
360 | | #define SHERK_UN ssyrk_UN |
361 | | #define SHERK_LN ssyrk_LN |
362 | | #define SHERK_UC ssyrk_UT |
363 | | #define SHERK_LC ssyrk_LT |
364 | | |
365 | | #define SHER2K_UN ssyr2k_UN |
366 | | #define SHER2K_LN ssyr2k_LN |
367 | | #define SHER2K_UC ssyr2k_UT |
368 | | #define SHER2K_LC ssyr2k_LT |
369 | | /* SSYR2K: the UR and LR names reuse the UN and LN targets, and UC and LC reuse UT and LT. The two SSYR2K_KERNEL names follow. */ |
370 | | #define SSYR2K_UN ssyr2k_UN |
371 | | #define SSYR2K_UT ssyr2k_UT |
372 | | #define SSYR2K_LN ssyr2k_LN |
373 | | #define SSYR2K_LT ssyr2k_LT |
374 | | #define SSYR2K_UR ssyr2k_UN |
375 | | #define SSYR2K_UC ssyr2k_UT |
376 | | #define SSYR2K_LR ssyr2k_LN |
377 | | #define SSYR2K_LC ssyr2k_LT |
378 | | |
379 | | #define SSYR2K_KERNEL_U ssyr2k_kernel_U |
380 | | #define SSYR2K_KERNEL_L ssyr2k_kernel_L |
381 | | /* STRMM_<4 letters>: 32 names onto 16 targets. An R in the second letter reuses the N target and a C reuses the T target. */ |
382 | 0 | #define STRMM_LNUU strmm_LNUU |
383 | 0 | #define STRMM_LNUN strmm_LNUN |
384 | 0 | #define STRMM_LNLU strmm_LNLU |
385 | 0 | #define STRMM_LNLN strmm_LNLN |
386 | | #define STRMM_LTUU strmm_LTUU |
387 | | #define STRMM_LTUN strmm_LTUN |
388 | | #define STRMM_LTLU strmm_LTLU |
389 | | #define STRMM_LTLN strmm_LTLN |
390 | | #define STRMM_LRUU strmm_LNUU |
391 | | #define STRMM_LRUN strmm_LNUN |
392 | | #define STRMM_LRLU strmm_LNLU |
393 | | #define STRMM_LRLN strmm_LNLN |
394 | | #define STRMM_LCUU strmm_LTUU |
395 | | #define STRMM_LCUN strmm_LTUN |
396 | | #define STRMM_LCLU strmm_LTLU |
397 | | #define STRMM_LCLN strmm_LTLN |
398 | | #define STRMM_RNUU strmm_RNUU |
399 | | #define STRMM_RNUN strmm_RNUN |
400 | | #define STRMM_RNLU strmm_RNLU |
401 | | #define STRMM_RNLN strmm_RNLN |
402 | | #define STRMM_RTUU strmm_RTUU |
403 | | #define STRMM_RTUN strmm_RTUN |
404 | | #define STRMM_RTLU strmm_RTLU |
405 | | #define STRMM_RTLN strmm_RTLN |
406 | | #define STRMM_RRUU strmm_RNUU |
407 | | #define STRMM_RRUN strmm_RNUN |
408 | | #define STRMM_RRLU strmm_RNLU |
409 | | #define STRMM_RRLN strmm_RNLN |
410 | | #define STRMM_RCUU strmm_RTUU |
411 | | #define STRMM_RCUN strmm_RTUN |
412 | | #define STRMM_RCLU strmm_RTLU |
413 | | #define STRMM_RCLN strmm_RTLN |
414 | | /* STRSM_<4 letters>: 32 names onto 16 targets. An R in the second letter reuses the N target and a C reuses the T target. */ |
415 | | #define STRSM_LNUU strsm_LNUU |
416 | | #define STRSM_LNUN strsm_LNUN |
417 | | #define STRSM_LNLU strsm_LNLU |
418 | | #define STRSM_LNLN strsm_LNLN |
419 | | #define STRSM_LTUU strsm_LTUU |
420 | | #define STRSM_LTUN strsm_LTUN |
421 | | #define STRSM_LTLU strsm_LTLU |
422 | | #define STRSM_LTLN strsm_LTLN |
423 | | #define STRSM_LRUU strsm_LNUU |
424 | | #define STRSM_LRUN strsm_LNUN |
425 | | #define STRSM_LRLU strsm_LNLU |
426 | | #define STRSM_LRLN strsm_LNLN |
427 | | #define STRSM_LCUU strsm_LTUU |
428 | | #define STRSM_LCUN strsm_LTUN |
429 | | #define STRSM_LCLU strsm_LTLU |
430 | | #define STRSM_LCLN strsm_LTLN |
431 | 0 | #define STRSM_RNUU strsm_RNUU |
432 | 0 | #define STRSM_RNUN strsm_RNUN |
433 | 0 | #define STRSM_RNLU strsm_RNLU |
434 | 0 | #define STRSM_RNLN strsm_RNLN |
435 | | #define STRSM_RTUU strsm_RTUU |
436 | | #define STRSM_RTUN strsm_RTUN |
437 | | #define STRSM_RTLU strsm_RTLU |
438 | | #define STRSM_RTLN strsm_RTLN |
439 | | #define STRSM_RRUU strsm_RNUU |
440 | | #define STRSM_RRUN strsm_RNUN |
441 | | #define STRSM_RRLU strsm_RNLU |
442 | | #define STRSM_RRLN strsm_RNLN |
443 | | #define STRSM_RCUU strsm_RTUU |
444 | | #define STRSM_RCUN strsm_RTUN |
445 | | #define STRSM_RCLU strsm_RTLU |
446 | | #define STRSM_RCLN strsm_RTLN |
447 | | /* SGEMM_THREAD_xy: same collapsing as SGEMM_xy, with R mapping like N and C like T, onto four sgemm_thread_* targets. */ |
448 | | #define SGEMM_THREAD_NN sgemm_thread_nn |
449 | | #define SGEMM_THREAD_CN sgemm_thread_tn |
450 | | #define SGEMM_THREAD_TN sgemm_thread_tn |
451 | | #define SGEMM_THREAD_NC sgemm_thread_nt |
452 | | #define SGEMM_THREAD_NT sgemm_thread_nt |
453 | | #define SGEMM_THREAD_CC sgemm_thread_tt |
454 | | #define SGEMM_THREAD_CT sgemm_thread_tt |
455 | | #define SGEMM_THREAD_TC sgemm_thread_tt |
456 | | #define SGEMM_THREAD_TT sgemm_thread_tt |
457 | | #define SGEMM_THREAD_NR sgemm_thread_nn |
458 | | #define SGEMM_THREAD_TR sgemm_thread_tn |
459 | | #define SGEMM_THREAD_CR sgemm_thread_tn |
460 | | #define SGEMM_THREAD_RN sgemm_thread_nn |
461 | | #define SGEMM_THREAD_RT sgemm_thread_nt |
462 | | #define SGEMM_THREAD_RC sgemm_thread_nt |
463 | | #define SGEMM_THREAD_RR sgemm_thread_nn |
464 | | /* SSYMM_THREAD_* and SHEMM_THREAD_* each map to their own like-named targets. */ |
465 | | #define SSYMM_THREAD_LU ssymm_thread_LU |
466 | | #define SSYMM_THREAD_LL ssymm_thread_LL |
467 | | #define SSYMM_THREAD_RU ssymm_thread_RU |
468 | | #define SSYMM_THREAD_RL ssymm_thread_RL |
469 | | |
470 | | #define SHEMM_THREAD_LU shemm_thread_LU |
471 | | #define SHEMM_THREAD_LL shemm_thread_LL |
472 | | #define SHEMM_THREAD_RU shemm_thread_RU |
473 | | #define SHEMM_THREAD_RL shemm_thread_RL |
474 | | /* SSYRK_THREAD_* and SHERK_THREAD_* share the four ssyrk_thread_* targets; the R suffix reuses N and the C suffix reuses T. */ |
475 | | #define SSYRK_THREAD_UN ssyrk_thread_UN |
476 | | #define SSYRK_THREAD_UT ssyrk_thread_UT |
477 | | #define SSYRK_THREAD_LN ssyrk_thread_LN |
478 | | #define SSYRK_THREAD_LT ssyrk_thread_LT |
479 | | #define SSYRK_THREAD_UR ssyrk_thread_UN |
480 | | #define SSYRK_THREAD_UC ssyrk_thread_UT |
481 | | #define SSYRK_THREAD_LR ssyrk_thread_LN |
482 | | #define SSYRK_THREAD_LC ssyrk_thread_LT |
483 | | |
484 | | #define SHERK_THREAD_UN ssyrk_thread_UN |
485 | | #define SHERK_THREAD_UT ssyrk_thread_UT |
486 | | #define SHERK_THREAD_LN ssyrk_thread_LN |
487 | | #define SHERK_THREAD_LT ssyrk_thread_LT |
488 | | #define SHERK_THREAD_UR ssyrk_thread_UN |
489 | | #define SHERK_THREAD_UC ssyrk_thread_UT |
490 | | #define SHERK_THREAD_LR ssyrk_thread_LN |
491 | | #define SHERK_THREAD_LC ssyrk_thread_LT |
492 | | |
493 | | #endif /* COMMON_S_H */ |