1
/* ---------------------------------------------------------------------
3
* -- Automatically Tuned Linear Algebra Software (ATLAS)
4
* (C) Copyright 2000 All Rights Reserved
6
* -- ATLAS routine -- Version 3.0 -- April 1, 2000
8
* -- Suggestions, comments, bug reports should be sent to the follo-
9
* wing e-mail address: atlas@cs.utk.edu
11
* Author : Antoine P. Petitet
12
* Contributor(s) : R. Clint Whaley
13
* University of Tennessee - Innovative Computing Laboratory
14
* Knoxville TN, 37996-1301, USA.
16
* ---------------------------------------------------------------------
18
* -- Copyright notice and Licensing terms:
20
* Redistribution and use in source and binary forms, with or without
21
* modification, are permitted provided that the following conditions
24
* 1. Redistributions of source code must retain the above copyright
25
* notice, this list of conditions and the following disclaimer.
26
* 2. Redistributions in binary form must reproduce the above copyright
27
* notice, this list of conditions, and the following disclaimer in
28
* the documentation and/or other materials provided with the distri-
30
* 3. The name of the University, the ATLAS group, or the names of its
31
* contributors may not be used to endorse or promote products deri-
32
* ved from this software without specific written permission.
36
* THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
37
* ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
38
* LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
39
* A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE UNIVERSITY
40
* OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPE-
41
* CIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED
42
* TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA,
43
* OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEO-
44
* RY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (IN-
45
* CLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
46
* THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
48
* ---------------------------------------------------------------------
53
#include "atlas_misc.h"
56
#include "atlas_level1.h"
57
#include "atlas_kernel2.h"
58
#include "atlas_reflvl2.h"
59
#include "atlas_lvl2.h"
61
/* Blocked driver for the packed, lower-triangular matrix-vector update on X
   described in the comment below (the LT suffix presumably means
   "lower, transposed" -- confirm against the reference implementation). */
void Mjoin( PATL, tpmvLT )
63
const enum ATLAS_DIAG DIAG,
74
* Mjoin( PATL, tpmvLT ) performs the following matrix-vector operation
78
* where x is an n-element vector and A is an n by n unit or non-unit,
79
* lower triangular matrix supplied in packed form.
81
* This is a blocked version of the algorithm. For a more detailed des-
82
* cription of the arguments of this function, see the reference imple-
83
* mentation in the ATLAS/src/blas/reference directory.
85
* ---------------------------------------------------------------------
88
* .. Local Variables ..
93
/* Two-element constant built from ATL_rone and ATL_rzero; it is handed to
   gpmv0 for both of its scalar arguments. */
TYPE one[2] = { ATL_rone, ATL_rzero };
96
int incX, lda, lda0, mb, mb1, n, nb;
/* Triangular kernel applied to each block; bound to the non-unit or unit
   variant from DIAG in the executable statements. */
97
void (*tpmv0)( const int, const TYPE *, const int,
99
/* Kernel called inside the loop ahead of every tpmv0 call. The
   a1_x1_b1_y1 suffix presumably encodes alpha = 1, incX = 1, beta = 1,
   incY = 1 -- confirm against the kernel's declaration. */
#define gpmv0 Mjoin( PATL, gpmvLT_a1_x1_b1_y1 )
101
* .. Executable Statements ..
104
/* Ask the partitioning helper for the blocking factors (presumably stored
   into mb and nb); of the two, only mb is referenced in the statements
   below. */
ATL_GetPartMVT( A, LDA, &mb, &nb );
106
/* Choose the triangular kernel matching the diagonal type requested. */
if( DIAG == AtlasNonUnit ) tpmv0 = Mjoin( PATL, tpmvLTN );
107
else tpmv0 = Mjoin( PATL, tpmvLTU );
109
/* mb1 is the size of the leading block: N minus a whole number of mb-sized
   blocks, so for N >= 1 and mb >= 1 it lies in 1..mb and N - mb1 is a
   multiple of mb. incX is the amount X moves per mb-sized block; SHIFT is
   defined elsewhere (presumably an element-to-storage scaling for complex
   TYPE -- confirm). */
mb1 = N - ( ( N - 1 ) / mb ) * mb; incX = (mb SHIFT);
110
/* lda0 and A0 keep the incoming leading dimension and matrix start for the
   gpmv0 calls, while lda and A are the working copies passed to tpmv0 and
   MLpnext (presumably updated in place by that macro -- confirm). */
lda = lda0 = LDA; A0 = (TYPE *)(A);
111
/* Leading block: run the triangular kernel on the first mb1 elements, then
   step A (via MLpnext) and X past them. */
tpmv0( mb1, A, lda, X ); MLpnext( mb1, A, lda ); X += (mb1 SHIFT);
113
/* Remaining blocks, mb elements at a time; n is the number of elements of
   the vector that precede the block X currently points at. */
for( n = mb1; n < N; n += mb, X += incX )
115
/* Sizes (n, mb) on the packed data starting at A0 + (n SHIFT) with the
   original leading dimension; X is passed in the input-vector position and
   x0 in the output-vector position (x0 presumably points at the start of
   the vector -- confirm where it is initialised). */
gpmv0( n, mb, one, A0 + (n SHIFT), lda0, X, 1, one, x0, 1 );
116
/* Triangular kernel on the current mb-sized block, then step A onward. */
tpmv0( mb, A, lda, X ); MLpnext( mb, A, lda );
119
* End of Mjoin( PATL, tpmvLT )