1 /*********************************************************************/
2 /* */
3 /* Optimized BLAS libraries */
4 /* By Kazushige Goto <kgoto@tacc.utexas.edu> */
5 /* */
6 /* Copyright (c) The University of Texas, 2009. All rights reserved. */
7 /* UNIVERSITY EXPRESSLY DISCLAIMS ANY AND ALL WARRANTIES CONCERNING */
8 /* THIS SOFTWARE AND DOCUMENTATION, INCLUDING ANY WARRANTIES OF */
9 /* MERCHANTABILITY, FITNESS FOR ANY PARTICULAR PURPOSE, */
10 /* NON-INFRINGEMENT AND WARRANTIES OF PERFORMANCE, AND ANY WARRANTY */
11 /* THAT MIGHT OTHERWISE ARISE FROM COURSE OF DEALING OR USAGE OF */
12 /* TRADE. NO WARRANTY IS EITHER EXPRESS OR IMPLIED WITH RESPECT TO */
13 /* THE USE OF THE SOFTWARE OR DOCUMENTATION. */
14 /* Under no circumstances shall University be liable for incidental, */
15 /* special, indirect, direct or consequential damages or loss of */
16 /* profits, interruption of business, or related expenses which may */
17 /* arise from use of Software or Documentation, including but not */
18 /* limited to those resulting from defects in Software and/or */
19 /* Documentation, or loss or inaccuracy of data of any kind. */
20 /*********************************************************************/
21
22 #include <stdio.h>
23 #include "common.h"
24 #ifdef FUNCTION_PROFILE
25 #include "functable.h"
26 #endif
27
/*
 * Routine name handed to xerbla when argument validation fails.
 *
 * The leading letter mirrors the kernels selected for the same build
 * configuration in the lauu2[] dispatch table (xlauu2_*, zlauu2_*,
 * clauu2_*), so the XDOUBLE build reports "XLAUU2"; the previous "QLAUU2"
 * did not match the routine that is actually being called.
 */
#ifdef XDOUBLE
#define ERROR_NAME "XLAUU2"
#elif defined(DOUBLE)
#define ERROR_NAME "ZLAUU2"
#else
#define ERROR_NAME "CLAUU2"
#endif
35
36 static blasint (*lauu2[])(blas_arg_t *, BLASLONG *, BLASLONG *, FLOAT *, FLOAT *, BLASLONG) = {
37
38 #ifdef XDOUBLE
39 xlauu2_U, xlauu2_L,
40 #elif defined(DOUBLE)
41 zlauu2_U, zlauu2_L,
42 #else
43 clauu2_U, clauu2_L,
44 #endif
45 };
46
/*
 * Fortran-style entry point for the LAUU2 routine named by ERROR_NAME.
 *
 * UPLO  selects the kernel after TOUPPER normalisation: 'U' -> lauu2[0],
 *       'L' -> lauu2[1]; anything else is rejected as argument 1.
 * N     matrix order; a negative value is rejected as argument 2.
 * a     matrix storage, forwarded to the kernel through args.a.
 * ldA   leading dimension; values below MAX(1, N) are rejected as
 *       argument 4.
 * Info  output status: -k when argument k is invalid (xerbla is called
 *       first), 0 when N is 0 and nothing is done, otherwise the value
 *       returned by the selected kernel.
 *
 * The function's own return value is always 0.
 */
int NAME(char *UPLO, blasint *N, FLOAT *a, blasint *ldA, blasint *Info){

  blas_arg_t args;

  blasint uplo_char = *UPLO;
  blasint uplo_index;
  blasint info;
  FLOAT *work;
  /* On PPC440 the scratch pointers are external objects, not locals. */
#ifdef PPC440
  extern
#endif
  FLOAT *sa, *sb;

  PRINT_DEBUG_NAME;

  args.a   = (void *)a;
  args.n   = *N;
  args.lda = *ldA;

  TOUPPER(uplo_char);

  switch (uplo_char) {
  case 'U':
    uplo_index = 0;
    break;
  case 'L':
    uplo_index = 1;
    break;
  default:
    uplo_index = -1;
    break;
  }

  /* When several arguments are bad, the lowest-numbered one is reported. */
  if (uplo_index < 0) {
    info = 1;
  } else if (args.n < 0) {
    info = 2;
  } else if (args.lda < MAX(1, args.n)) {
    info = 4;
  } else {
    info = 0;
  }

  if (info != 0) {
    BLASFUNC(xerbla)(ERROR_NAME, &info, sizeof(ERROR_NAME));
    *Info = -info;
    return 0;
  }

  *Info = 0;

  /* Nothing to compute for an empty matrix. */
  if (args.n <= 0) {
    return 0;
  }

  IDEBUG_START;

  FUNCTION_PROFILE_START();

#ifndef PPC440
  work = (FLOAT *)blas_memory_alloc(1);

  /* sa starts GEMM_OFFSET_A bytes into the buffer; sb follows the aligned
     GEMM_P x GEMM_Q region, shifted by GEMM_OFFSET_B. */
  sa = (FLOAT *)((BLASLONG)work + GEMM_OFFSET_A);
  sb = (FLOAT *)(((BLASLONG)sa
                  + ((GEMM_P * GEMM_Q * COMPSIZE * SIZE + GEMM_ALIGN) & ~GEMM_ALIGN))
                 + GEMM_OFFSET_B);
#endif

  info = (lauu2[uplo_index])(&args, NULL, NULL, sa, sb, 0);

  *Info = info;

#ifndef PPC440
  blas_memory_free(work);
#endif

  FUNCTION_PROFILE_END(1, .5 * args.n * args.n,
		       2. * args.n * (1./3. + args.n * ( 1./2. + args.n * 1./6.))
		       +  6. * 1./6. * args.n * (args.n * args.n - 1));

  IDEBUG_END;

  return 0;
}
113