1 /*****************************************************************************
2   Copyright (c) 2014, Intel Corp.
3   All rights reserved.
4 
5   Redistribution and use in source and binary forms, with or without
6   modification, are permitted provided that the following conditions are met:
7 
8     * Redistributions of source code must retain the above copyright notice,
9       this list of conditions and the following disclaimer.
10     * Redistributions in binary form must reproduce the above copyright
11       notice, this list of conditions and the following disclaimer in the
12       documentation and/or other materials provided with the distribution.
13     * Neither the name of Intel Corporation nor the names of its contributors
14       may be used to endorse or promote products derived from this software
15       without specific prior written permission.
16 
17   THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
18   AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
19   IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
20   ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
21   LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
22   CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
23   SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
24   INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
25   CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
26   ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF
27   THE POSSIBILITY OF SUCH DAMAGE.
28 *****************************************************************************
29 * Contents: Native middle-level C interface to LAPACK function sgbrfs
30 * Author: Intel Corporation
31 *****************************************************************************/
32 
33 #include "lapacke_utils.h"
34 
/*
 * Middle-level C wrapper around the LAPACK routine sgbrfs.
 *
 * The caller supplies every workspace (work, iwork); this wrapper only
 * allocates the temporaries needed to re-lay out the matrices when
 * matrix_layout is LAPACK_ROW_MAJOR.
 *
 * Return value:
 *   -1                             matrix_layout is neither LAPACK_COL_MAJOR
 *                                  nor LAPACK_ROW_MAJOR
 *   -8, -10, -13, -15              row-major only: ldab < n, ldafb < n,
 *                                  ldb < nrhs or ldx < nrhs respectively
 *   LAPACK_TRANSPOSE_MEMORY_ERROR  row-major only: a temporary could not be
 *                                  allocated
 *   otherwise                      the info value produced by LAPACK_sgbrfs,
 *                                  with negative values decremented by one
 *
 * LAPACKE_xerbla is called for every error detected by the wrapper itself.
 */
lapack_int LAPACKE_sgbrfs_work( int matrix_layout, char trans, lapack_int n,
                                lapack_int kl, lapack_int ku, lapack_int nrhs,
                                const float* ab, lapack_int ldab,
                                const float* afb, lapack_int ldafb,
                                const lapack_int* ipiv, const float* b,
                                lapack_int ldb, float* x, lapack_int ldx,
                                float* ferr, float* berr, float* work,
                                lapack_int* iwork )
{
    lapack_int info = 0;
    /* Leading dimensions of the temporaries handed to LAPACK */
    lapack_int band_ld;
    lapack_int fact_ld;
    lapack_int rhs_ld;
    lapack_int sol_ld;
    /* Temporaries receiving the re-laid-out copies of ab, afb, b and x */
    float* band_tmp = NULL;
    float* fact_tmp = NULL;
    float* rhs_tmp = NULL;
    float* sol_tmp = NULL;

    /* Reject an unknown layout up front */
    if( matrix_layout != LAPACK_COL_MAJOR &&
        matrix_layout != LAPACK_ROW_MAJOR ) {
        info = -1;
        LAPACKE_xerbla( "LAPACKE_sgbrfs_work", info );
        return info;
    }

    if( matrix_layout == LAPACK_COL_MAJOR ) {
        /* The caller's arrays are passed to LAPACK unchanged */
        LAPACK_sgbrfs( &trans, &n, &kl, &ku, &nrhs, ab, &ldab, afb, &ldafb,
                       ipiv, b, &ldb, x, &ldx, ferr, berr, work, iwork, &info );
        if( info < 0 ) {
            /* Negative info values are shifted by one, as in the row-major
             * path below */
            info -= 1;
        }
        return info;
    }

    /* ---- Row-major layout from here on ---- */

    /* Validate the caller's leading dimensions; the first failure wins */
    if( ldab < n ) {
        info = -8;
    } else if( ldafb < n ) {
        info = -10;
    } else if( ldb < nrhs ) {
        info = -13;
    } else if( ldx < nrhs ) {
        info = -15;
    }
    if( info != 0 ) {
        LAPACKE_xerbla( "LAPACKE_sgbrfs_work", info );
        return info;
    }

    /* Leading dimensions used for the temporaries */
    band_ld = MAX(1,kl+ku+1);
    fact_ld = MAX(1,2*kl+ku+1);
    rhs_ld = MAX(1,n);
    sol_ld = MAX(1,n);

    /* Allocate the temporaries; on failure unwind only what was obtained */
    band_tmp = (float*)LAPACKE_malloc( sizeof(float) * band_ld * MAX(1,n) );
    if( band_tmp == NULL ) {
        info = LAPACK_TRANSPOSE_MEMORY_ERROR;
        goto release_none;
    }
    fact_tmp = (float*)LAPACKE_malloc( sizeof(float) * fact_ld * MAX(1,n) );
    if( fact_tmp == NULL ) {
        info = LAPACK_TRANSPOSE_MEMORY_ERROR;
        goto release_band;
    }
    rhs_tmp = (float*)LAPACKE_malloc( sizeof(float) * rhs_ld * MAX(1,nrhs) );
    if( rhs_tmp == NULL ) {
        info = LAPACK_TRANSPOSE_MEMORY_ERROR;
        goto release_fact;
    }
    sol_tmp = (float*)LAPACKE_malloc( sizeof(float) * sol_ld * MAX(1,nrhs) );
    if( sol_tmp == NULL ) {
        info = LAPACK_TRANSPOSE_MEMORY_ERROR;
        goto release_rhs;
    }

    /* Copy the inputs into the temporaries; afb is transposed with kl+ku
     * as its upper bandwidth argument */
    LAPACKE_sgb_trans( matrix_layout, n, n, kl, ku, ab, ldab,
                       band_tmp, band_ld );
    LAPACKE_sgb_trans( matrix_layout, n, n, kl, kl+ku, afb, ldafb,
                       fact_tmp, fact_ld );
    LAPACKE_sge_trans( matrix_layout, n, nrhs, b, ldb, rhs_tmp, rhs_ld );
    LAPACKE_sge_trans( matrix_layout, n, nrhs, x, ldx, sol_tmp, sol_ld );

    /* Run LAPACK on the temporaries and shift negative info by one */
    LAPACK_sgbrfs( &trans, &n, &kl, &ku, &nrhs, band_tmp, &band_ld, fact_tmp,
                   &fact_ld, ipiv, rhs_tmp, &rhs_ld, sol_tmp, &sol_ld, ferr,
                   berr, work, iwork, &info );
    if( info < 0 ) {
        info -= 1;
    }

    /* x is the only matrix copied back to the caller */
    LAPACKE_sge_trans( LAPACK_COL_MAJOR, n, nrhs, sol_tmp, sol_ld, x, ldx );

    /* Release the temporaries in reverse order of allocation */
    LAPACKE_free( sol_tmp );
release_rhs:
    LAPACKE_free( rhs_tmp );
release_fact:
    LAPACKE_free( fact_tmp );
release_band:
    LAPACKE_free( band_tmp );
release_none:
    if( info == LAPACK_TRANSPOSE_MEMORY_ERROR ) {
        LAPACKE_xerbla( "LAPACKE_sgbrfs_work", info );
    }
    return info;
}
136