/root/doris/contrib/openblas/interface/axpy.c
Line | Count | Source |
1 | | /*********************************************************************/ |
2 | | /* Copyright 2009, 2010 The University of Texas at Austin. */ |
3 | | /* All rights reserved. */ |
4 | | /* */ |
5 | | /* Redistribution and use in source and binary forms, with or */ |
6 | | /* without modification, are permitted provided that the following */ |
7 | | /* conditions are met: */ |
8 | | /* */ |
9 | | /* 1. Redistributions of source code must retain the above */ |
10 | | /* copyright notice, this list of conditions and the following */ |
11 | | /* disclaimer. */ |
12 | | /* */ |
13 | | /* 2. Redistributions in binary form must reproduce the above */ |
14 | | /* copyright notice, this list of conditions and the following */ |
15 | | /* disclaimer in the documentation and/or other materials */ |
16 | | /* provided with the distribution. */ |
17 | | /* */ |
18 | | /* THIS SOFTWARE IS PROVIDED BY THE UNIVERSITY OF TEXAS AT */ |
19 | | /* AUSTIN ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, */ |
20 | | /* INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF */ |
21 | | /* MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE */ |
22 | | /* DISCLAIMED. IN NO EVENT SHALL THE UNIVERSITY OF TEXAS AT */ |
23 | | /* AUSTIN OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, */ |
24 | | /* INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES */ |
25 | | /* (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE */ |
26 | | /* GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR */ |
27 | | /* BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF */ |
28 | | /* LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT */ |
29 | | /* (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT */ |
30 | | /* OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE */ |
31 | | /* POSSIBILITY OF SUCH DAMAGE. */ |
32 | | /* */ |
33 | | /* The views and conclusions contained in the software and */ |
34 | | /* documentation are those of the authors and should not be */ |
35 | | /* interpreted as representing official policies, either expressed */ |
36 | | /* or implied, of The University of Texas at Austin. */ |
37 | | /*********************************************************************/ |
38 | | |
39 | | #include <stdio.h> |
40 | | #include "common.h" |
41 | | #ifdef FUNCTION_PROFILE |
42 | | #include "functable.h" |
43 | | #endif |
/* Element-count cutoff for threading: the SMP path below keeps vectors with
   n <= MULTI_THREAD_MINIMAL on a single thread. Builds that define Z13 use a
   larger cutoff than all other targets. */
#if !defined(Z13)
#define MULTI_THREAD_MINIMAL 10000
#else
#define MULTI_THREAD_MINIMAL 200000
#endif
49 | | #ifndef CBLAS |
50 | | |
51 | 0 | void NAME(blasint *N, FLOAT *ALPHA, FLOAT *x, blasint *INCX, FLOAT *y, blasint *INCY){ |
52 | |
|
53 | 0 | BLASLONG n = *N; |
54 | 0 | BLASLONG incx = *INCX; |
55 | 0 | BLASLONG incy = *INCY; |
56 | 0 | FLOAT alpha = *ALPHA; |
57 | |
|
58 | | #else |
59 | | |
60 | | void CNAME(blasint n, FLOAT alpha, FLOAT *x, blasint incx, FLOAT *y, blasint incy){ |
61 | | |
62 | | #endif |
63 | |
|
64 | 0 | #ifdef SMP |
65 | 0 | int mode, nthreads; |
66 | 0 | #endif |
67 | |
|
68 | 0 | #ifndef CBLAS |
69 | 0 | PRINT_DEBUG_NAME; |
70 | | #else |
71 | | PRINT_DEBUG_CNAME; |
72 | | #endif |
73 | |
|
74 | 0 | if (n <= 0) return; |
75 | | |
76 | 0 | if (alpha == ZERO) return; |
77 | | |
78 | 0 | if (incx == 0 && incy == 0) { |
79 | 0 | *y += n * alpha *(*x); |
80 | 0 | return; |
81 | 0 | } |
82 | | |
83 | 0 | IDEBUG_START; |
84 | |
|
85 | 0 | FUNCTION_PROFILE_START(); |
86 | |
|
87 | 0 | if (incx < 0) x -= (n - 1) * incx; |
88 | 0 | if (incy < 0) y -= (n - 1) * incy; |
89 | |
|
90 | 0 | #ifdef SMP |
91 | | //disable multi-thread when incx==0 or incy==0 |
92 | | //In that case, the threads would be dependent. |
93 | | // |
94 | | //Temporarily work-around the low performance issue with small input size & |
95 | | //multithreads. |
96 | 0 | if (incx == 0 || incy == 0 || n <= MULTI_THREAD_MINIMAL) |
97 | 0 | nthreads = 1; |
98 | 0 | else |
99 | 0 | nthreads = num_cpu_avail(1); |
100 | |
|
101 | 0 | if (nthreads == 1) { |
102 | 0 | #endif |
103 | |
|
104 | 0 | AXPYU_K(n, 0, 0, alpha, x, incx, y, incy, NULL, 0); |
105 | |
|
106 | 0 | #ifdef SMP |
107 | 0 | } else { |
108 | |
|
109 | | #ifdef XDOUBLE |
110 | | mode = BLAS_XDOUBLE | BLAS_REAL; |
111 | | #elif defined(DOUBLE) |
112 | 0 | mode = BLAS_DOUBLE | BLAS_REAL; |
113 | | #else |
114 | | mode = BLAS_SINGLE | BLAS_REAL; |
115 | | #endif |
116 | |
|
117 | 0 | blas_level1_thread(mode, n, 0, 0, &alpha, |
118 | 0 | x, incx, y, incy, NULL, 0, (int (*)(void))AXPYU_K, nthreads); |
119 | |
|
120 | 0 | } |
121 | 0 | #endif |
122 | |
|
123 | 0 | FUNCTION_PROFILE_END(1, 2 * n, 2 * n); |
124 | |
|
125 | 0 | IDEBUG_END; |
126 | |
|
127 | 0 | return; |
128 | |
|
129 | 0 | } |