2
* Automatically Tuned Linear Algebra Software v3.2
3
* (C) Copyright 1999 R. Clint Whaley
5
* Redistribution and use in source and binary forms, with or without
6
* modification, are permitted provided that the following conditions
8
* 1. Redistributions of source code must retain the above copyright
9
* notice, this list of conditions and the following disclaimer.
10
* 2. Redistributions in binary form must reproduce the above copyright
11
* notice, this list of conditions, and the following disclaimer in the
12
* documentation and/or other materials provided with the distribution.
13
* 3. The name of the University of Tennessee, the ATLAS group,
14
* or the names of its contributors may not be used to endorse
15
* or promote products derived from this software without specific
18
* THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
19
* ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
20
* TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
21
* PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE UNIVERSITY OR CONTRIBUTORS BE
22
* LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
23
* CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
24
* SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
25
* INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
26
* CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
27
* ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
28
* POSSIBILITY OF SUCH DAMAGE.
33
#include "atlas_misc.h"
35
#ifdef ATL_USEPTHREADS
36
#include "atlas_ptalias2.h"
38
#include "atlas_level2.h"
40
void cblas_chbmv(const enum CBLAS_ORDER Order, const enum CBLAS_UPLO Uplo,
41
const int N, const int K, const void *alpha, const void *A,
42
const int lda, const void *X, const int incX,
43
const void *beta, void *Y, const int incY)
46
const enum CBLAS_UPLO ruplo = (Uplo == CblasUpper) ? CblasLower : CblasUpper;
48
float *X0, *x = (float*) X;
50
const float *alp=alpha;
51
const float *bet=beta;
52
float calpha[2], cbeta[2];
53
const float one[2] = {ATL_rone, ATL_rzero};
59
#ifndef NoCblasErrorChecks
60
if (Order != CblasColMajor && Order != CblasRowMajor)
61
info = cblas_errprn(1, info, "Order must be %d or %d, but is set to %d",
62
CblasRowMajor, CblasColMajor, Order);
63
if (Uplo != CblasUpper && Uplo != CblasLower)
64
info = cblas_errprn(2, info,
65
"Uplo must be %d or %d, but is set to %d",
66
CblasUpper, CblasLower, Uplo);
68
if (N < 0) info = cblas_errprn(3, info,
69
"N cannot be less than zero; is set to %d.", N);
71
info = cblas_errprn(4, info, "Valid K: 0 < K < N; K=%d, N=%d.", K, N);
72
if (lda < K+1) info = cblas_errprn(7, info,
73
"lda cannot be less than K+1; K=%d, lda=%d\n", K, lda);
74
if (!incX) info = cblas_errprn(9, info,
75
"incX cannot be zero; is set to %d.", incX);
76
if (!incY) info = cblas_errprn(12, info,
77
"incY cannot be zero; is set to %d.", incY);
80
cblas_xerbla(info, "cblas_chbmv", "");
85
if (incX < 0) x += (1-N)*incX<<1;
86
if (incY < 0) y += (1-N)*incY<<1;
87
if (Order == CblasColMajor)
88
ATL_chbmv(Uplo, N, K, alpha, A, lda, x, incX, beta, y, incY);
91
vx = malloc(ATL_Cachelen + 2*N*sizeof(float));
95
ATL_cmoveConj(N, calpha, X0, incX, x, 1);
96
if (*bet != ATL_rzero || bet[1] != ATL_rzero)
98
ATL_cscalConj(N, cbeta, y, incY);
99
ATL_chbmv(ruplo, N, K, one, A, lda, x, 1, one, y, incY);
101
else ATL_chbmv(ruplo, N, K, one, A, lda, x, 1, beta, y, incY);
103
ATL_cscalConj(N, one, y, incY);