blob: 32e1e0a3c2c50c88e2fbd967d2a1d361929582b4 [file] [log] [blame]
/**************************************************************************************************
* *
* This file is part of BLASFEO. *
* *
* BLASFEO -- BLAS For Embedded Optimization. *
* Copyright (C) 2016-2017 by Gianluca Frison. *
* Developed at IMTEK (University of Freiburg) under the supervision of Moritz Diehl. *
* All rights reserved. *
* *
* HPMPC is free software; you can redistribute it and/or *
* modify it under the terms of the GNU Lesser General Public *
* License as published by the Free Software Foundation; either *
* version 2.1 of the License, or (at your option) any later version. *
* *
* HPMPC is distributed in the hope that it will be useful, *
* but WITHOUT ANY WARRANTY; without even the implied warranty of *
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. *
* See the GNU Lesser General Public License for more details. *
* *
* You should have received a copy of the GNU Lesser General Public *
* License along with HPMPC; if not, write to the Free Software *
* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA *
* *
* Author: Gianluca Frison, giaf (at) dtu.dk *
* gianluca.frison (at) imtek.uni-freiburg.de *
* *
**************************************************************************************************/
#if defined(LA_REFERENCE)
void GEMV_N_LIBSTR(int m, int n, REAL alpha, struct STRMAT *sA, int ai, int aj, struct STRVEC *sx, int xi, REAL beta, struct STRVEC *sy, int yi, struct STRVEC *sz, int zi)
{
int ii, jj;
REAL
y_0, y_1, y_2, y_3,
x_0, x_1;
int lda = sA->m;
REAL *pA = sA->pA + ai + aj*lda;
REAL *x = sx->pa + xi;
REAL *y = sy->pa + yi;
REAL *z = sz->pa + zi;
#if 1 // y reg version
ii = 0;
for(; ii<m-1; ii+=2)
{
y_0 = 0.0;
y_1 = 0.0;
jj = 0;
for(; jj<n-1; jj+=2)
{
y_0 += pA[ii+0+lda*(jj+0)] * x[jj+0] + pA[ii+0+lda*(jj+1)] * x[jj+1];
y_1 += pA[ii+1+lda*(jj+0)] * x[jj+0] + pA[ii+1+lda*(jj+1)] * x[jj+1];
}
if(jj<n)
{
y_0 += pA[ii+0+lda*jj] * x[jj];
y_1 += pA[ii+1+lda*jj] * x[jj];
}
z[ii+0] = beta * y[ii+0] + alpha * y_0;
z[ii+1] = beta * y[ii+1] + alpha * y_1;
}
for(; ii<m; ii++)
{
y_0 = 0.0;
for(jj=0; jj<n; jj++)
{
y_0 += pA[ii+lda*jj] * x[jj];
}
z[ii] = beta * y[ii] + alpha * y_0;
}
#else // x reg version
for(ii=0; ii<n; ii++)
{
z[ii] = beta * y[ii];
}
jj = 0;
for(; jj<n-1; jj+=2)
{
x_0 = alpha * x[jj+0];
x_1 = alpha * x[jj+1];
ii = 0;
for(; ii<m-1; ii+=2)
{
z[ii+0] += pA[ii+0+lda*(jj+0)] * x_0 + pA[ii+0+lda*(jj+1)] * x_1;
z[ii+1] += pA[ii+1+lda*(jj+0)] * x_0 + pA[ii+1+lda*(jj+1)] * x_1;
}
for(; ii<m; ii++)
{
z[ii] += pA[ii+lda*(jj+0)] * x_0;
z[ii] += pA[ii+lda*(jj+1)] * x_1;
}
}
for(; jj<n; jj++)
{
x_0 = alpha * x[jj+0];
for(ii=0; ii<m; ii++)
{
z[ii] += pA[ii+lda*(jj+0)] * x_0;
}
}
#endif
return;
}
void GEMV_T_LIBSTR(int m, int n, REAL alpha, struct STRMAT *sA, int ai, int aj, struct STRVEC *sx, int xi, REAL beta, struct STRVEC *sy, int yi, struct STRVEC *sz, int zi)
{
int ii, jj;
REAL
y_0, y_1;
int lda = sA->m;
REAL *pA = sA->pA + ai + aj*lda;
REAL *x = sx->pa + xi;
REAL *y = sy->pa + yi;
REAL *z = sz->pa + zi;
jj = 0;
for(; jj<n-1; jj+=2)
{
y_0 = 0.0;
y_1 = 0.0;
ii = 0;
for(; ii<m-1; ii+=2)
{
y_0 += pA[ii+0+lda*(jj+0)] * x[ii+0] + pA[ii+1+lda*(jj+0)] * x[ii+1];
y_1 += pA[ii+0+lda*(jj+1)] * x[ii+0] + pA[ii+1+lda*(jj+1)] * x[ii+1];
}
if(ii<m)
{
y_0 += pA[ii+lda*(jj+0)] * x[ii];
y_1 += pA[ii+lda*(jj+1)] * x[ii];
}
z[jj+0] = beta * y[jj+0] + alpha * y_0;
z[jj+1] = beta * y[jj+1] + alpha * y_1;
}
for(; jj<n; jj++)
{
y_0 = 0.0;
for(ii=0; ii<m; ii++)
{
y_0 += pA[ii+lda*(jj+0)] * x[ii];
}
z[jj+0] = beta * y[jj+0] + alpha * y_0;
}
return;
}
// TODO optimize !!!!!
void GEMV_NT_LIBSTR(int m, int n, REAL alpha_n, REAL alpha_t, struct STRMAT *sA, int ai, int aj, struct STRVEC *sx_n, int xi_n, struct STRVEC *sx_t, int xi_t, REAL beta_n, REAL beta_t, struct STRVEC *sy_n, int yi_n, struct STRVEC *sy_t, int yi_t, struct STRVEC *sz_n, int zi_n, struct STRVEC *sz_t, int zi_t)
{
int ii, jj;
REAL
a_00,
x_n_0,
y_t_0;
int lda = sA->m;
REAL *pA = sA->pA + ai + aj*lda;
REAL *x_n = sx_n->pa + xi_n;
REAL *x_t = sx_t->pa + xi_t;
REAL *y_n = sy_n->pa + yi_n;
REAL *y_t = sy_t->pa + yi_t;
REAL *z_n = sz_n->pa + zi_n;
REAL *z_t = sz_t->pa + zi_t;
for(ii=0; ii<m; ii++)
{
z_n[ii] = beta_n * y_n[ii];
}
for(jj=0; jj<n; jj++)
{
y_t_0 = 0.0;
x_n_0 = alpha_n * x_n[jj];
for(ii=0; ii<m; ii++)
{
a_00 = pA[ii+lda*jj];
z_n[ii] += a_00 * x_n_0;
y_t_0 += a_00 * x_t[ii];
}
z_t[jj] = beta_t * y_t[jj] + alpha_t * y_t_0;
}
return;
}
// TODO optimize !!!!!
void SYMV_L_LIBSTR(int m, int n, REAL alpha, struct STRMAT *sA, int ai, int aj, struct STRVEC *sx, int xi, REAL beta, struct STRVEC *sy, int yi, struct STRVEC *sz, int zi)
{
int ii, jj;
REAL
y_0;
int lda = sA->m;
REAL *pA = sA->pA + ai + aj*lda;
REAL *x = sx->pa + xi;
REAL *y = sy->pa + yi;
REAL *z = sz->pa + zi;
for(ii=0; ii<n; ii++)
{
y_0 = 0.0;
jj = 0;
for(; jj<=ii; jj++)
{
y_0 += pA[ii+lda*jj] * x[jj];
}
for( ; jj<m; jj++)
{
y_0 += pA[jj+lda*ii] * x[jj];
}
z[ii] = beta * y[ii] + alpha * y_0;
}
return;
}
void TRMV_LNN_LIBSTR(int m, int n, struct STRMAT *sA, int ai, int aj, struct STRVEC *sx, int xi, struct STRVEC *sz, int zi)
{
int ii, jj;
REAL
y_0, y_1;
int lda = sA->m;
REAL *pA = sA->pA + ai + aj*lda;
REAL *x = sx->pa + xi;
REAL *z = sz->pa + zi;
if(m-n>0)
{
GEMV_N_LIBSTR(m-n, n, 1.0, sA, ai+n, aj, sx, xi, 0.0, sz, zi+n, sz, zi+n);
}
if(n%2!=0)
{
ii = n-1;
y_0 = x[ii];
y_0 *= pA[ii+lda*ii];
for(jj=0; jj<ii; jj++)
{
y_0 += pA[ii+lda*jj] * x[jj];
}
z[ii] = y_0;
n -= 1;
}
for(ii=n-2; ii>=0; ii-=2)
{
y_0 = x[ii+0];
y_1 = x[ii+1];
y_1 *= pA[ii+1+lda*(ii+1)];
y_1 += pA[ii+1+lda*(ii+0)] * y_0;
y_0 *= pA[ii+0+lda*(ii+0)];
jj = 0;
for(; jj<ii-1; jj+=2)
{
y_0 += pA[ii+0+lda*(jj+0)] * x[jj+0] + pA[ii+0+lda*(jj+1)] * x[jj+1];
y_1 += pA[ii+1+lda*(jj+0)] * x[jj+0] + pA[ii+1+lda*(jj+1)] * x[jj+1];
}
// XXX there is no clean up loop !!!!!
// for(; jj<ii; jj++)
// {
// y_0 += pA[ii+0+lda*jj] * x[jj];
// y_1 += pA[ii+1+lda*jj] * x[jj];
// }
z[ii+0] = y_0;
z[ii+1] = y_1;
}
return;
}
void TRMV_LTN_LIBSTR(int m, int n, struct STRMAT *sA, int ai, int aj, struct STRVEC *sx, int xi, struct STRVEC *sz, int zi)
{
int ii, jj;
REAL
y_0, y_1;
int lda = sA->m;
REAL *pA = sA->pA + ai + aj*lda;
REAL *x = sx->pa + xi;
REAL *z = sz->pa + zi;
jj = 0;
for(; jj<n-1; jj+=2)
{
y_0 = x[jj+0];
y_1 = x[jj+1];
y_0 *= pA[jj+0+lda*(jj+0)];
y_0 += pA[jj+1+lda*(jj+0)] * y_1;
y_1 *= pA[jj+1+lda*(jj+1)];
ii = jj+2;
for(; ii<m-1; ii+=2)
{
y_0 += pA[ii+0+lda*(jj+0)] * x[ii+0] + pA[ii+1+lda*(jj+0)] * x[ii+1];
y_1 += pA[ii+0+lda*(jj+1)] * x[ii+0] + pA[ii+1+lda*(jj+1)] * x[ii+1];
}
for(; ii<m; ii++)
{
y_0 += pA[ii+lda*(jj+0)] * x[ii];
y_1 += pA[ii+lda*(jj+1)] * x[ii];
}
z[jj+0] = y_0;
z[jj+1] = y_1;
}
for(; jj<n; jj++)
{
y_0 = x[jj];
y_0 *= pA[jj+lda*jj];
for(ii=jj+1; ii<m; ii++)
{
y_0 += pA[ii+lda*jj] * x[ii];
}
z[jj] = y_0;
}
return;
}
void TRMV_UNN_LIBSTR(int m, struct STRMAT *sA, int ai, int aj, struct STRVEC *sx, int xi, struct STRVEC *sz, int zi)
{
int ii, jj;
REAL
y_0, y_1,
x_0, x_1;
int lda = sA->m;
REAL *pA = sA->pA + ai + aj*lda;
REAL *x = sx->pa + xi;
REAL *z = sz->pa + zi;
#if 1 // y reg version
jj = 0;
for(; jj<m-1; jj+=2)
{
y_0 = x[jj+0];
y_1 = x[jj+1];
y_0 = pA[jj+0+lda*(jj+0)] * y_0;
y_0 += pA[jj+0+lda*(jj+1)] * y_1;
y_1 = pA[jj+1+lda*(jj+1)] * y_1;
ii = jj+2;
for(; ii<m-1; ii+=2)
{
y_0 += pA[jj+0+lda*(ii+0)] * x[ii+0] + pA[jj+0+lda*(ii+1)] * x[ii+1];
y_1 += pA[jj+1+lda*(ii+0)] * x[ii+0] + pA[jj+1+lda*(ii+1)] * x[ii+1];
}
if(ii<m)
{
y_0 += pA[jj+0+lda*(ii+0)] * x[ii+0];
y_1 += pA[jj+1+lda*(ii+0)] * x[ii+0];
}
z[jj+0] = y_0;
z[jj+1] = y_1;
}
for(; jj<m; jj++)
{
y_0 = pA[jj+lda*jj] * x[jj];
for(ii=jj+1; ii<m; ii++)
{
y_0 += pA[jj+lda*ii] * x[ii];
}
z[jj] = y_0;
}
#else // x reg version
if(x != z)
{
for(ii=0; ii<m; ii++)
z[ii] = x[ii];
}
jj = 0;
for(; jj<m-1; jj+=2)
{
x_0 = z[jj+0];
x_1 = z[jj+1];
ii = 0;
for(; ii<jj-1; ii+=2)
{
z[ii+0] += pA[ii+0+lda*(jj+0)] * x_0 + pA[ii+0+lda*(jj+1)] * x_1;
z[ii+1] += pA[ii+1+lda*(jj+0)] * x_0 + pA[ii+1+lda*(jj+1)] * x_1;
}
// XXX there is no clean-up loop, since jj+=2 !!!!!
// for(; ii<jj; ii++)
// {
// z[ii+0] += pA[ii+0+lda*(jj+0)] * x_0 + pA[ii+0+lda*(jj+1)] * x_1;
// }
x_0 *= pA[jj+0+lda*(jj+0)];
x_0 += pA[jj+0+lda*(jj+1)] * x_1;
x_1 *= pA[jj+1+lda*(jj+1)];
z[jj+0] = x_0;
z[jj+1] = x_1;
}
for(; jj<m; jj++)
{
x_0 = z[jj];
for(ii=0; ii<jj; ii++)
{
z[ii] += pA[ii+lda*jj] * x_0;
}
x_0 *= pA[jj+lda*jj];
z[jj] = x_0;
}
#endif
return;
}
void TRMV_UTN_LIBSTR(int m, struct STRMAT *sA, int ai, int aj, struct STRVEC *sx, int xi, struct STRVEC *sz, int zi)
{
int ii, jj;
REAL
y_0, y_1;
int lda = sA->m;
REAL *pA = sA->pA + ai + aj*lda;
REAL *x = sx->pa + xi;
REAL *z = sz->pa + zi;
if(m%2!=0)
{
jj = m-1;
y_0 = pA[jj+lda*jj] * x[jj];
for(ii=0; ii<jj; ii++)
{
y_0 += pA[ii+lda*jj] * x[ii];
}
z[jj] = y_0;
m -= 1; // XXX
}
for(jj=m-2; jj>=0; jj-=2)
{
y_1 = pA[jj+1+lda*(jj+1)] * x[jj+1];
y_1 += pA[jj+0+lda*(jj+1)] * x[jj+0];
y_0 = pA[jj+0+lda*(jj+0)] * x[jj+0];
for(ii=0; ii<jj-1; ii+=2)
{
y_0 += pA[ii+0+lda*(jj+0)] * x[ii+0] + pA[ii+1+lda*(jj+0)] * x[ii+1];
y_1 += pA[ii+0+lda*(jj+1)] * x[ii+0] + pA[ii+1+lda*(jj+1)] * x[ii+1];
}
// XXX there is no clean-up loop !!!!!
// if(ii<jj)
// {
// y_0 += pA[ii+lda*(jj+0)] * x[ii];
// y_1 += pA[ii+lda*(jj+1)] * x[ii];
// }
z[jj+0] = y_0;
z[jj+1] = y_1;
}
return;
}
void TRSV_LNN_MN_LIBSTR(int m, int n, struct STRMAT *sA, int ai, int aj, struct STRVEC *sx, int xi, struct STRVEC *sz, int zi)
{
if(m==0 | n==0)
return;
#if defined(DIM_CHECK)
// non-negative size
if(m<0) printf("\n****** trsv_lnn_mn_libstr : m<0 : %d<0 *****\n", m);
if(n<0) printf("\n****** trsv_lnn_mn_libstr : n<0 : %d<0 *****\n", n);
// non-negative offset
if(ai<0) printf("\n****** trsv_lnn_mn_libstr : ai<0 : %d<0 *****\n", ai);
if(aj<0) printf("\n****** trsv_lnn_mn_libstr : aj<0 : %d<0 *****\n", aj);
if(xi<0) printf("\n****** trsv_lnn_mn_libstr : xi<0 : %d<0 *****\n", xi);
if(zi<0) printf("\n****** trsv_lnn_mn_libstr : zi<0 : %d<0 *****\n", zi);
// inside matrix
// A: m x k
if(ai+m > sA->m) printf("\n***** trsv_lnn_mn_libstr : ai+m > row(A) : %d+%d > %d *****\n", ai, m, sA->m);
if(aj+n > sA->n) printf("\n***** trsv_lnn_mn_libstr : aj+n > col(A) : %d+%d > %d *****\n", aj, n, sA->n);
// x: m
if(xi+m > sx->m) printf("\n***** trsv_lnn_mn_libstr : xi+m > size(x) : %d+%d > %d *****\n", xi, m, sx->m);
// z: m
if(zi+m > sz->m) printf("\n***** trsv_lnn_mn_libstr : zi+m > size(z) : %d+%d > %d *****\n", zi, m, sz->m);
#endif
int ii, jj, j1;
REAL
y_0, y_1,
x_0, x_1;
int lda = sA->m;
REAL *pA = sA->pA + ai + aj*lda;
REAL *dA = sA->dA;
REAL *x = sx->pa + xi;
REAL *z = sz->pa + zi;
if(ai==0 & aj==0)
{
if(sA->use_dA!=1)
{
for(ii=0; ii<n; ii++)
dA[ii] = 1.0 / pA[ii+lda*ii];
sA->use_dA = 1;
}
}
else
{
for(ii=0; ii<n; ii++)
dA[ii] = 1.0 / pA[ii+lda*ii];
sA->use_dA = 0;
}
#if 1 // y reg version
ii = 0;
for(; ii<n-1; ii+=2)
{
y_0 = x[ii+0];
y_1 = x[ii+1];
jj = 0;
for(; jj<ii-1; jj+=2)
{
y_0 -= pA[ii+0+lda*(jj+0)] * z[jj+0] + pA[ii+0+lda*(jj+1)] * z[jj+1];
y_1 -= pA[ii+1+lda*(jj+0)] * z[jj+0] + pA[ii+1+lda*(jj+1)] * z[jj+1];
}
// XXX there is no clean-up loop !!!!!
// if(jj<ii)
// {
// y_0 -= pA[ii+0+lda*(jj+0)] * z[jj+0];
// y_1 -= pA[ii+1+lda*(jj+0)] * z[jj+0];
// }
y_0 *= dA[ii+0];
y_1 -= pA[ii+1+lda*(jj+0)] * y_0;
y_1 *= dA[ii+1];
z[ii+0] = y_0;
z[ii+1] = y_1;
}
for(; ii<n; ii++)
{
y_0 = x[ii];
for(jj=0; jj<ii; jj++)
{
y_0 -= pA[ii+lda*jj] * z[jj];
}
y_0 *= dA[ii];
z[ii] = y_0;
}
for(; ii<m-1; ii+=2)
{
y_0 = x[ii+0];
y_1 = x[ii+1];
jj = 0;
for(; jj<n-1; jj+=2)
{
y_0 -= pA[ii+0+lda*(jj+0)] * z[jj+0] + pA[ii+0+lda*(jj+1)] * z[jj+1];
y_1 -= pA[ii+1+lda*(jj+0)] * z[jj+0] + pA[ii+1+lda*(jj+1)] * z[jj+1];
}
if(jj<n)
{
y_0 -= pA[ii+0+lda*(jj+0)] * z[jj+0];
y_1 -= pA[ii+1+lda*(jj+0)] * z[jj+0];
}
z[ii+0] = y_0;
z[ii+1] = y_1;
}
for(; ii<m; ii++)
{
y_0 = x[ii];
for(jj=0; jj<n; jj++)
{
y_0 -= pA[ii+lda*jj] * z[jj];
}
z[ii] = y_0;
}
#else // x reg version
if(x != z)
{
for(ii=0; ii<m; ii++)
z[ii] = x[ii];
}
jj = 0;
for(; jj<n-1; jj+=2)
{
x_0 = dA[jj+0] * z[jj+0];
x_1 = z[jj+1] - pA[jj+1+lda*(jj+0)] * x_0;
x_1 = dA[jj+1] * x_1;
z[jj+0] = x_0;
z[jj+1] = x_1;
ii = jj+2;
for(; ii<m-1; ii+=2)
{
z[ii+0] -= pA[ii+0+lda*(jj+0)] * x_0 + pA[ii+0+lda*(jj+1)] * x_1;
z[ii+1] -= pA[ii+1+lda*(jj+0)] * x_0 + pA[ii+1+lda*(jj+1)] * x_1;
}
for(; ii<m; ii++)
{
z[ii] -= pA[ii+lda*(jj+0)] * x_0 + pA[ii+lda*(jj+1)] * x_1;
}
}
for(; jj<n; jj++)
{
x_0 = dA[jj] * z[jj];
z[jj] = x_0;
for(ii=jj+1; ii<m; ii++)
{
z[ii] -= pA[ii+lda*jj] * x_0;
}
}
#endif
return;
}
void TRSV_LTN_MN_LIBSTR(int m, int n, struct STRMAT *sA, int ai, int aj, struct STRVEC *sx, int xi, struct STRVEC *sz, int zi)
{
if(m==0)
return;
#if defined(DIM_CHECK)
// non-negative size
if(m<0) printf("\n****** trsv_ltn_mn_libstr : m<0 : %d<0 *****\n", m);
if(n<0) printf("\n****** trsv_ltn_mn_libstr : n<0 : %d<0 *****\n", n);
// non-negative offset
if(ai<0) printf("\n****** trsv_ltn_mn_libstr : ai<0 : %d<0 *****\n", ai);
if(aj<0) printf("\n****** trsv_ltn_mn_libstr : aj<0 : %d<0 *****\n", aj);
if(xi<0) printf("\n****** trsv_ltn_mn_libstr : xi<0 : %d<0 *****\n", xi);
if(zi<0) printf("\n****** trsv_ltn_mn_libstr : zi<0 : %d<0 *****\n", zi);
// inside matrix
// A: m x k
if(ai+m > sA->m) printf("\n***** trsv_ltn_mn_libstr : ai+m > row(A) : %d+%d > %d *****\n", ai, m, sA->m);
if(aj+n > sA->n) printf("\n***** trsv_ltn_mn_libstr : aj+n > col(A) : %d+%d > %d *****\n", aj, n, sA->n);
// x: m
if(xi+m > sx->m) printf("\n***** trsv_ltn_mn_libstr : xi+m > size(x) : %d+%d > %d *****\n", xi, m, sx->m);
// z: m
if(zi+m > sz->m) printf("\n***** trsv_ltn_mn_libstr : zi+m > size(z) : %d+%d > %d *****\n", zi, m, sz->m);
#endif
int ii, jj;
REAL
y_0, y_1;
int lda = sA->m;
REAL *pA = sA->pA + ai + aj*lda;
REAL *dA = sA->dA;
REAL *x = sx->pa + xi;
REAL *z = sz->pa + zi;
if(ai==0 & aj==0)
{
if(sA->use_dA!=1)
{
for(ii=0; ii<n; ii++)
dA[ii] = 1.0 / pA[ii+lda*ii];
sA->use_dA = 1;
}
}
else
{
for(ii=0; ii<n; ii++)
dA[ii] = 1.0 / pA[ii+lda*ii];
sA->use_dA = 0;
}
if(n%2!=0)
{
jj = n-1;
y_0 = x[jj];
for(ii=jj+1; ii<m; ii++)
{
y_0 -= pA[ii+lda*jj] * z[ii];
}
y_0 *= dA[jj];
z[jj] = y_0;
jj -= 2;
}
else
{
jj = n-2;
}
for(; jj>=0; jj-=2)
{
y_0 = x[jj+0];
y_1 = x[jj+1];
ii = jj+2;
for(; ii<m-1; ii+=2)
{
y_0 -= pA[ii+0+lda*(jj+0)] * z[ii+0] + pA[ii+1+lda*(jj+0)] * z[ii+1];
y_1 -= pA[ii+0+lda*(jj+1)] * z[ii+0] + pA[ii+1+lda*(jj+1)] * z[ii+1];
}
if(ii<m)
{
y_0 -= pA[ii+lda*(jj+0)] * z[ii];
y_1 -= pA[ii+lda*(jj+1)] * z[ii];
}
y_1 *= dA[jj+1];
y_0 -= pA[jj+1+lda*(jj+0)] * y_1;
y_0 *= dA[jj+0];
z[jj+0] = y_0;
z[jj+1] = y_1;
}
return;
}
void TRSV_LNN_LIBSTR(int m, struct STRMAT *sA, int ai, int aj, struct STRVEC *sx, int xi, struct STRVEC *sz, int zi)
{
if(m==0)
return;
#if defined(DIM_CHECK)
// non-negative size
if(m<0) printf("\n****** trsv_lnn_libstr : m<0 : %d<0 *****\n", m);
// non-negative offset
if(ai<0) printf("\n****** trsv_lnn_libstr : ai<0 : %d<0 *****\n", ai);
if(aj<0) printf("\n****** trsv_lnn_libstr : aj<0 : %d<0 *****\n", aj);
if(xi<0) printf("\n****** trsv_lnn_libstr : xi<0 : %d<0 *****\n", xi);
if(zi<0) printf("\n****** trsv_lnn_libstr : zi<0 : %d<0 *****\n", zi);
// inside matrix
// A: m x k
if(ai+m > sA->m) printf("\n***** trsv_lnn_libstr : ai+m > row(A) : %d+%d > %d *****\n", ai, m, sA->m);
if(aj+m > sA->n) printf("\n***** trsv_lnn_libstr : aj+m > col(A) : %d+%d > %d *****\n", aj, m, sA->n);
// x: m
if(xi+m > sx->m) printf("\n***** trsv_lnn_libstr : xi+m > size(x) : %d+%d > %d *****\n", xi, m, sx->m);
// z: m
if(zi+m > sz->m) printf("\n***** trsv_lnn_libstr : zi+m > size(z) : %d+%d > %d *****\n", zi, m, sz->m);
#endif
int ii, jj, j1;
REAL
y_0, y_1,
x_0, x_1;
int lda = sA->m;
REAL *pA = sA->pA + ai + aj*lda;
REAL *dA = sA->dA;
REAL *x = sx->pa + xi;
REAL *z = sz->pa + zi;
if(ai==0 & aj==0)
{
if(sA->use_dA!=1)
{
for(ii=0; ii<m; ii++)
dA[ii] = 1.0 / pA[ii+lda*ii];
sA->use_dA = 1;
}
}
else
{
for(ii=0; ii<m; ii++)
dA[ii] = 1.0 / pA[ii+lda*ii];
sA->use_dA = 0;
}
ii = 0;
for(; ii<m-1; ii+=2)
{
y_0 = x[ii+0];
y_1 = x[ii+1];
jj = 0;
for(; jj<ii-1; jj+=2)
{
y_0 -= pA[ii+0+lda*(jj+0)] * z[jj+0] + pA[ii+0+lda*(jj+1)] * z[jj+1];
y_1 -= pA[ii+1+lda*(jj+0)] * z[jj+0] + pA[ii+1+lda*(jj+1)] * z[jj+1];
}
y_0 *= dA[ii+0];
y_1 -= pA[ii+1+lda*(jj+0)] * y_0;
y_1 *= dA[ii+1];
z[ii+0] = y_0;
z[ii+1] = y_1;
}
for(; ii<m; ii++)
{
y_0 = x[ii];
for(jj=0; jj<ii; jj++)
{
y_0 -= pA[ii+lda*jj] * z[jj];
}
y_0 *= dA[ii];
z[ii] = y_0;
}
return;
}
void TRSV_LNU_LIBSTR(int m, struct STRMAT *sA, int ai, int aj, struct STRVEC *sx, int xi, struct STRVEC *sz, int zi)
{
if(m==0)
return;
#if defined(DIM_CHECK)
// non-negative size
if(m<0) printf("\n****** trsv_lnu_libstr : m<0 : %d<0 *****\n", m);
// non-negative offset
if(ai<0) printf("\n****** trsv_lnu_libstr : ai<0 : %d<0 *****\n", ai);
if(aj<0) printf("\n****** trsv_lnu_libstr : aj<0 : %d<0 *****\n", aj);
if(xi<0) printf("\n****** trsv_lnu_libstr : xi<0 : %d<0 *****\n", xi);
if(zi<0) printf("\n****** trsv_lnu_libstr : zi<0 : %d<0 *****\n", zi);
// inside matrix
// A: m x k
if(ai+m > sA->m) printf("\n***** trsv_lnu_libstr : ai+m > row(A) : %d+%d > %d *****\n", ai, m, sA->m);
if(aj+m > sA->n) printf("\n***** trsv_lnu_libstr : aj+m > col(A) : %d+%d > %d *****\n", aj, m, sA->n);
// x: m
if(xi+m > sx->m) printf("\n***** trsv_lnu_libstr : xi+m > size(x) : %d+%d > %d *****\n", xi, m, sx->m);
// z: m
if(zi+m > sz->m) printf("\n***** trsv_lnu_libstr : zi+m > size(z) : %d+%d > %d *****\n", zi, m, sz->m);
#endif
printf("\n***** trsv_lnu_libstr : feature not implemented yet *****\n");
exit(1);
}
void TRSV_LTN_LIBSTR(int m, struct STRMAT *sA, int ai, int aj, struct STRVEC *sx, int xi, struct STRVEC *sz, int zi)
{
if(m==0)
return;
#if defined(DIM_CHECK)
// non-negative size
if(m<0) printf("\n****** trsv_ltn_libstr : m<0 : %d<0 *****\n", m);
// non-negative offset
if(ai<0) printf("\n****** trsv_ltn_libstr : ai<0 : %d<0 *****\n", ai);
if(aj<0) printf("\n****** trsv_ltn_libstr : aj<0 : %d<0 *****\n", aj);
if(xi<0) printf("\n****** trsv_ltn_libstr : xi<0 : %d<0 *****\n", xi);
if(zi<0) printf("\n****** trsv_ltn_libstr : zi<0 : %d<0 *****\n", zi);
// inside matrix
// A: m x k
if(ai+m > sA->m) printf("\n***** trsv_ltn_libstr : ai+m > row(A) : %d+%d > %d *****\n", ai, m, sA->m);
if(aj+m > sA->n) printf("\n***** trsv_ltn_libstr : aj+m > col(A) : %d+%d > %d *****\n", aj, m, sA->n);
// x: m
if(xi+m > sx->m) printf("\n***** trsv_ltn_libstr : xi+m > size(x) : %d+%d > %d *****\n", xi, m, sx->m);
// z: m
if(zi+m > sz->m) printf("\n***** trsv_ltn_libstr : zi+m > size(z) : %d+%d > %d *****\n", zi, m, sz->m);
#endif
int ii, jj;
REAL
y_0, y_1;
int lda = sA->m;
REAL *pA = sA->pA + ai + aj*lda;
REAL *dA = sA->dA;
REAL *x = sx->pa + xi;
REAL *z = sz->pa + zi;
if(ai==0 & aj==0)
{
if(sA->use_dA!=1)
{
for(ii=0; ii<m; ii++)
dA[ii] = 1.0 / pA[ii+lda*ii];
sA->use_dA = 1;
}
}
else
{
for(ii=0; ii<m; ii++)
dA[ii] = 1.0 / pA[ii+lda*ii];
sA->use_dA = 0;
}
if(m%2!=0)
{
jj = m-1;
y_0 = x[jj];
y_0 *= dA[jj];
z[jj] = y_0;
jj -= 2;
}
else
{
jj = m-2;
}
for(; jj>=0; jj-=2)
{
y_0 = x[jj+0];
y_1 = x[jj+1];
ii = jj+2;
for(; ii<m-1; ii+=2)
{
y_0 -= pA[ii+0+lda*(jj+0)] * z[ii+0] + pA[ii+1+lda*(jj+0)] * z[ii+1];
y_1 -= pA[ii+0+lda*(jj+1)] * z[ii+0] + pA[ii+1+lda*(jj+1)] * z[ii+1];
}
if(ii<m)
{
y_0 -= pA[ii+lda*(jj+0)] * z[ii];
y_1 -= pA[ii+lda*(jj+1)] * z[ii];
}
y_1 *= dA[jj+1];
y_0 -= pA[jj+1+lda*(jj+0)] * y_1;
y_0 *= dA[jj+0];
z[jj+0] = y_0;
z[jj+1] = y_1;
}
return;
}
void TRSV_LTU_LIBSTR(int m, struct STRMAT *sA, int ai, int aj, struct STRVEC *sx, int xi, struct STRVEC *sz, int zi)
{
if(m==0)
return;
#if defined(DIM_CHECK)
// non-negative size
if(m<0) printf("\n****** trsv_ltu_libstr : m<0 : %d<0 *****\n", m);
// non-negative offset
if(ai<0) printf("\n****** trsv_ltu_libstr : ai<0 : %d<0 *****\n", ai);
if(aj<0) printf("\n****** trsv_ltu_libstr : aj<0 : %d<0 *****\n", aj);
if(xi<0) printf("\n****** trsv_ltu_libstr : xi<0 : %d<0 *****\n", xi);
if(zi<0) printf("\n****** trsv_ltu_libstr : zi<0 : %d<0 *****\n", zi);
// inside matrix
// A: m x k
if(ai+m > sA->m) printf("\n***** trsv_ltu_libstr : ai+m > row(A) : %d+%d > %d *****\n", ai, m, sA->m);
if(aj+m > sA->n) printf("\n***** trsv_ltu_libstr : aj+m > col(A) : %d+%d > %d *****\n", aj, m, sA->n);
// x: m
if(xi+m > sx->m) printf("\n***** trsv_ltu_libstr : xi+m > size(x) : %d+%d > %d *****\n", xi, m, sx->m);
// z: m
if(zi+m > sz->m) printf("\n***** trsv_ltu_libstr : zi+m > size(z) : %d+%d > %d *****\n", zi, m, sz->m);
#endif
printf("\n***** trsv_ltu_libstr : feature not implemented yet *****\n");
exit(1);
}
void TRSV_UNN_LIBSTR(int m, struct STRMAT *sA, int ai, int aj, struct STRVEC *sx, int xi, struct STRVEC *sz, int zi)
{
if(m==0)
return;
#if defined(DIM_CHECK)
// non-negative size
if(m<0) printf("\n****** trsv_unn_libstr : m<0 : %d<0 *****\n", m);
// non-negative offset
if(ai<0) printf("\n****** trsv_unn_libstr : ai<0 : %d<0 *****\n", ai);
if(aj<0) printf("\n****** trsv_unn_libstr : aj<0 : %d<0 *****\n", aj);
if(xi<0) printf("\n****** trsv_unn_libstr : xi<0 : %d<0 *****\n", xi);
if(zi<0) printf("\n****** trsv_unn_libstr : zi<0 : %d<0 *****\n", zi);
// inside matrix
// A: m x k
if(ai+m > sA->m) printf("\n***** trsv_unn_libstr : ai+m > row(A) : %d+%d > %d *****\n", ai, m, sA->m);
if(aj+m > sA->n) printf("\n***** trsv_unn_libstr : aj+m > col(A) : %d+%d > %d *****\n", aj, m, sA->n);
// x: m
if(xi+m > sx->m) printf("\n***** trsv_unn_libstr : xi+m > size(x) : %d+%d > %d *****\n", xi, m, sx->m);
// z: m
if(zi+m > sz->m) printf("\n***** trsv_unn_libstr : zi+m > size(z) : %d+%d > %d *****\n", zi, m, sz->m);
#endif
printf("\n***** trsv_unn_libstr : feature not implemented yet *****\n");
exit(1);
}
void TRSV_UTN_LIBSTR(int m, struct STRMAT *sA, int ai, int aj, struct STRVEC *sx, int xi, struct STRVEC *sz, int zi)
{
if(m==0)
return;
#if defined(DIM_CHECK)
// non-negative size
if(m<0) printf("\n****** trsv_utn_libstr : m<0 : %d<0 *****\n", m);
// non-negative offset
if(ai<0) printf("\n****** trsv_utn_libstr : ai<0 : %d<0 *****\n", ai);
if(aj<0) printf("\n****** trsv_utn_libstr : aj<0 : %d<0 *****\n", aj);
if(xi<0) printf("\n****** trsv_utn_libstr : xi<0 : %d<0 *****\n", xi);
if(zi<0) printf("\n****** trsv_utn_libstr : zi<0 : %d<0 *****\n", zi);
// inside matrix
// A: m x k
if(ai+m > sA->m) printf("\n***** trsv_utn_libstr : ai+m > row(A) : %d+%d > %d *****\n", ai, m, sA->m);
if(aj+m > sA->n) printf("\n***** trsv_utn_libstr : aj+m > col(A) : %d+%d > %d *****\n", aj, m, sA->n);
// x: m
if(xi+m > sx->m) printf("\n***** trsv_utn_libstr : xi+m > size(x) : %d+%d > %d *****\n", xi, m, sx->m);
// z: m
if(zi+m > sz->m) printf("\n***** trsv_utn_libstr : zi+m > size(z) : %d+%d > %d *****\n", zi, m, sz->m);
#endif
printf("\n***** trsv_utn_libstr : feature not implemented yet *****\n");
exit(1);
}
#elif defined(LA_BLAS)
void GEMV_N_LIBSTR(int m, int n, REAL alpha, struct STRMAT *sA, int ai, int aj, struct STRVEC *sx, int xi, REAL beta, struct STRVEC *sy, int yi, struct STRVEC *sz, int zi)
{
char cl = 'l';
char cn = 'n';
char cr = 'r';
char ct = 't';
char cu = 'u';
int i1 = 1;
int lda = sA->m;
REAL *pA = sA->pA + ai + aj*lda;
REAL *x = sx->pa + xi;
REAL *y = sy->pa + yi;
REAL *z = sz->pa + zi;
COPY(&m, y, &i1, z, &i1);
GEMV(&cn, &m, &n, &alpha, pA, &lda, x, &i1, &beta, z, &i1);
return;
}
void GEMV_T_LIBSTR(int m, int n, REAL alpha, struct STRMAT *sA, int ai, int aj, struct STRVEC *sx, int xi, REAL beta, struct STRVEC *sy, int yi, struct STRVEC *sz, int zi)
{
char cl = 'l';
char cn = 'n';
char cr = 'r';
char ct = 't';
char cu = 'u';
int i1 = 1;
int lda = sA->m;
REAL *pA = sA->pA + ai + aj*lda;
REAL *x = sx->pa + xi;
REAL *y = sy->pa + yi;
REAL *z = sz->pa + zi;
COPY(&n, y, &i1, z, &i1);
GEMV(&ct, &m, &n, &alpha, pA, &lda, x, &i1, &beta, z, &i1);
return;
}
void GEMV_NT_LIBSTR(int m, int n, REAL alpha_n, REAL alpha_t, struct STRMAT *sA, int ai, int aj, struct STRVEC *sx_n, int xi_n, struct STRVEC *sx_t, int xi_t, REAL beta_n, REAL beta_t, struct STRVEC *sy_n, int yi_n, struct STRVEC *sy_t, int yi_t, struct STRVEC *sz_n, int zi_n, struct STRVEC *sz_t, int zi_t)
{
char cl = 'l';
char cn = 'n';
char cr = 'r';
char ct = 't';
char cu = 'u';
int i1 = 1;
int lda = sA->m;
REAL *pA = sA->pA + ai + aj*lda;
REAL *x_n = sx_n->pa + xi_n;
REAL *x_t = sx_t->pa + xi_t;
REAL *y_n = sy_n->pa + yi_n;
REAL *y_t = sy_t->pa + yi_t;
REAL *z_n = sz_n->pa + zi_n;
REAL *z_t = sz_t->pa + zi_t;
COPY(&m, y_n, &i1, z_n, &i1);
GEMV(&cn, &m, &n, &alpha_n, pA, &lda, x_n, &i1, &beta_n, z_n, &i1);
COPY(&n, y_t, &i1, z_t, &i1);
GEMV(&ct, &m, &n, &alpha_t, pA, &lda, x_t, &i1, &beta_t, z_t, &i1);
return;
}
void SYMV_L_LIBSTR(int m, int n, REAL alpha, struct STRMAT *sA, int ai, int aj, struct STRVEC *sx, int xi, REAL beta, struct STRVEC *sy, int yi, struct STRVEC *sz, int zi)
{
char cl = 'l';
char cn = 'n';
char cr = 'r';
char ct = 't';
char cu = 'u';
int i1 = 1;
REAL d1 = 1.0;
int lda = sA->m;
REAL *pA = sA->pA + ai + aj*lda;
REAL *x = sx->pa + xi;
REAL *y = sy->pa + yi;
REAL *z = sz->pa + zi;
int tmp = m-n;
COPY(&m, y, &i1, z, &i1);
SYMV(&cl, &n, &alpha, pA, &lda, x, &i1, &beta, z, &i1);
GEMV(&cn, &tmp, &n, &alpha, pA+n, &lda, x, &i1, &beta, z+n, &i1);
GEMV(&ct, &tmp, &n, &alpha, pA+n, &lda, x+n, &i1, &d1, z, &i1);
return;
}
void TRMV_LNN_LIBSTR(int m, int n, struct STRMAT *sA, int ai, int aj, struct STRVEC *sx, int xi, struct STRVEC *sz, int zi)
{
char cl = 'l';
char cn = 'n';
char cr = 'r';
char ct = 't';
char cu = 'u';
int i1 = 1;
REAL d1 = 1.0;
REAL d0 = 0.0;
REAL dm1 = -1.0;
int lda = sA->m;
REAL *pA = sA->pA + ai + aj*lda;
REAL *x = sx->pa + xi;
REAL *z = sz->pa + zi;
int tmp = m-n;
if(x!=z)
COPY(&n, x, &i1, z, &i1);
GEMV(&cn, &tmp, &n, &d1, pA+n, &lda, x, &i1, &d0, z+n, &i1);
TRMV(&cl, &cn, &cn, &n, pA, &lda, z, &i1);
return;
}
void TRMV_LTN_LIBSTR(int m, int n, struct STRMAT *sA, int ai, int aj, struct STRVEC *sx, int xi, struct STRVEC *sz, int zi)
{
char cl = 'l';
char cn = 'n';
char cr = 'r';
char ct = 't';
char cu = 'u';
int i1 = 1;
REAL d1 = 1.0;
REAL dm1 = -1.0;
int lda = sA->m;
REAL *pA = sA->pA + ai + aj*lda;
REAL *x = sx->pa + xi;
REAL *z = sz->pa + zi;
int tmp = m-n;
if(x!=z)
COPY(&n, x, &i1, z, &i1);
TRMV(&cl, &ct, &cn, &n, pA, &lda, z, &i1);
GEMV(&ct, &tmp, &n, &d1, pA+n, &lda, x+n, &i1, &d1, z, &i1);
return;
}
void TRMV_UNN_LIBSTR(int m, struct STRMAT *sA, int ai, int aj, struct STRVEC *sx, int xi, struct STRVEC *sz, int zi)
{
char cl = 'l';
char cn = 'n';
char cr = 'r';
char ct = 't';
char cu = 'u';
int i1 = 1;
REAL d1 = 1.0;
REAL dm1 = -1.0;
int lda = sA->m;
REAL *pA = sA->pA + ai + aj*lda;
REAL *x = sx->pa + xi;
REAL *z = sz->pa + zi;
COPY(&m, x, &i1, z, &i1);
TRMV(&cu, &cn, &cn, &m, pA, &lda, z, &i1);
return;
}
void TRMV_UTN_LIBSTR(int m, struct STRMAT *sA, int ai, int aj, struct STRVEC *sx, int xi, struct STRVEC *sz, int zi)
{
char cl = 'l';
char cn = 'n';
char cr = 'r';
char ct = 't';
char cu = 'u';
int i1 = 1;
REAL d1 = 1.0;
REAL dm1 = -1.0;
int lda = sA->m;
REAL *pA = sA->pA + ai + aj*lda;
REAL *x = sx->pa + xi;
REAL *z = sz->pa + zi;
COPY(&m, x, &i1, z, &i1);
TRMV(&cu, &ct, &cn, &m, pA, &lda, z, &i1);
return;
}
void TRSV_LNN_MN_LIBSTR(int m, int n, struct STRMAT *sA, int ai, int aj, struct STRVEC *sx, int xi, struct STRVEC *sz, int zi)
{
if(m==0 | n==0)
return;
#if defined(DIM_CHECK)
// non-negative size
if(m<0) printf("\n****** trsv_lnn_mn_libstr : m<0 : %d<0 *****\n", m);
if(n<0) printf("\n****** trsv_lnn_mn_libstr : n<0 : %d<0 *****\n", n);
// non-negative offset
if(ai<0) printf("\n****** trsv_lnn_mn_libstr : ai<0 : %d<0 *****\n", ai);
if(aj<0) printf("\n****** trsv_lnn_mn_libstr : aj<0 : %d<0 *****\n", aj);
if(xi<0) printf("\n****** trsv_lnn_mn_libstr : xi<0 : %d<0 *****\n", xi);
if(zi<0) printf("\n****** trsv_lnn_mn_libstr : zi<0 : %d<0 *****\n", zi);
// inside matrix
// A: m x k
if(ai+m > sA->m) printf("\n***** trsv_lnn_mn_libstr : ai+m > row(A) : %d+%d > %d *****\n", ai, m, sA->m);
if(aj+n > sA->n) printf("\n***** trsv_lnn_mn_libstr : aj+n > col(A) : %d+%d > %d *****\n", aj, n, sA->n);
// x: m
if(xi+m > sx->m) printf("\n***** trsv_lnn_mn_libstr : xi+m > size(x) : %d+%d > %d *****\n", xi, m, sx->m);
// z: m
if(zi+m > sz->m) printf("\n***** trsv_lnn_mn_libstr : zi+m > size(z) : %d+%d > %d *****\n", zi, m, sz->m);
#endif
char cl = 'l';
char cn = 'n';
char cr = 'r';
char ct = 't';
char cu = 'u';
int i1 = 1;
REAL d1 = 1.0;
REAL dm1 = -1.0;
int mmn = m-n;
int lda = sA->m;
REAL *pA = sA->pA + ai + aj*lda;
REAL *x = sx->pa + xi;
REAL *z = sz->pa + zi;
COPY(&m, x, &i1, z, &i1);
TRSV(&cl, &cn, &cn, &n, pA, &lda, z, &i1);
GEMV(&cn, &mmn, &n, &dm1, pA+n, &lda, z, &i1, &d1, z+n, &i1);
return;
}
void TRSV_LTN_MN_LIBSTR(int m, int n, struct STRMAT *sA, int ai, int aj, struct STRVEC *sx, int xi, struct STRVEC *sz, int zi)
{
if(m==0)
return;
#if defined(DIM_CHECK)
// non-negative size
if(m<0) printf("\n****** trsv_ltn_mn_libstr : m<0 : %d<0 *****\n", m);
if(n<0) printf("\n****** trsv_ltn_mn_libstr : n<0 : %d<0 *****\n", n);
// non-negative offset
if(ai<0) printf("\n****** trsv_ltn_mn_libstr : ai<0 : %d<0 *****\n", ai);
if(aj<0) printf("\n****** trsv_ltn_mn_libstr : aj<0 : %d<0 *****\n", aj);
if(xi<0) printf("\n****** trsv_ltn_mn_libstr : xi<0 : %d<0 *****\n", xi);
if(zi<0) printf("\n****** trsv_ltn_mn_libstr : zi<0 : %d<0 *****\n", zi);
// inside matrix
// A: m x k
if(ai+m > sA->m) printf("\n***** trsv_ltn_mn_libstr : ai+m > row(A) : %d+%d > %d *****\n", ai, m, sA->m);
if(aj+n > sA->n) printf("\n***** trsv_ltn_mn_libstr : aj+n > col(A) : %d+%d > %d *****\n", aj, n, sA->n);
// x: m
if(xi+m > sx->m) printf("\n***** trsv_ltn_mn_libstr : xi+m > size(x) : %d+%d > %d *****\n", xi, m, sx->m);
// z: m
if(zi+m > sz->m) printf("\n***** trsv_ltn_mn_libstr : zi+m > size(z) : %d+%d > %d *****\n", zi, m, sz->m);
#endif
char cl = 'l';
char cn = 'n';
char cr = 'r';
char ct = 't';
char cu = 'u';
int i1 = 1;
REAL d1 = 1.0;
REAL dm1 = -1.0;
int mmn = m-n;
int lda = sA->m;
REAL *pA = sA->pA + ai + aj*lda;
REAL *x = sx->pa + xi;
REAL *z = sz->pa + zi;
COPY(&m, x, &i1, z, &i1);
GEMV(&ct, &mmn, &n, &dm1, pA+n, &lda, z+n, &i1, &d1, z, &i1);
TRSV(&cl, &ct, &cn, &n, pA, &lda, z, &i1);
return;
}
void TRSV_LNN_LIBSTR(int m, struct STRMAT *sA, int ai, int aj, struct STRVEC *sx, int xi, struct STRVEC *sz, int zi)
{
if(m==0)
return;
#if defined(DIM_CHECK)
// non-negative size
if(m<0) printf("\n****** trsv_lnn_libstr : m<0 : %d<0 *****\n", m);
// non-negative offset
if(ai<0) printf("\n****** trsv_lnn_libstr : ai<0 : %d<0 *****\n", ai);
if(aj<0) printf("\n****** trsv_lnn_libstr : aj<0 : %d<0 *****\n", aj);
if(xi<0) printf("\n****** trsv_lnn_libstr : xi<0 : %d<0 *****\n", xi);
if(zi<0) printf("\n****** trsv_lnn_libstr : zi<0 : %d<0 *****\n", zi);
// inside matrix
// A: m x k
if(ai+m > sA->m) printf("\n***** trsv_lnn_libstr : ai+m > row(A) : %d+%d > %d *****\n", ai, m, sA->m);
if(aj+m > sA->n) printf("\n***** trsv_lnn_libstr : aj+m > col(A) : %d+%d > %d *****\n", aj, m, sA->n);
// x: m
if(xi+m > sx->m) printf("\n***** trsv_lnn_libstr : xi+m > size(x) : %d+%d > %d *****\n", xi, m, sx->m);
// z: m
if(zi+m > sz->m) printf("\n***** trsv_lnn_libstr : zi+m > size(z) : %d+%d > %d *****\n", zi, m, sz->m);
#endif
char cl = 'l';
char cn = 'n';
char cr = 'r';
char ct = 't';
char cu = 'u';
int i1 = 1;
REAL d1 = 1.0;
REAL dm1 = -1.0;
int lda = sA->m;
REAL *pA = sA->pA + ai + aj*lda;
REAL *x = sx->pa + xi;
REAL *z = sz->pa + zi;
COPY(&m, x, &i1, z, &i1);
TRSV(&cl, &cn, &cn, &m, pA, &lda, z, &i1);
return;
}
void TRSV_LNU_LIBSTR(int m, struct STRMAT *sA, int ai, int aj, struct STRVEC *sx, int xi, struct STRVEC *sz, int zi)
{
if(m==0)
return;
#if defined(DIM_CHECK)
// non-negative size
if(m<0) printf("\n****** trsv_lnu_libstr : m<0 : %d<0 *****\n", m);
// non-negative offset
if(ai<0) printf("\n****** trsv_lnu_libstr : ai<0 : %d<0 *****\n", ai);
if(aj<0) printf("\n****** trsv_lnu_libstr : aj<0 : %d<0 *****\n", aj);
if(xi<0) printf("\n****** trsv_lnu_libstr : xi<0 : %d<0 *****\n", xi);
if(zi<0) printf("\n****** trsv_lnu_libstr : zi<0 : %d<0 *****\n", zi);
// inside matrix
// A: m x k
if(ai+m > sA->m) printf("\n***** trsv_lnu_libstr : ai+m > row(A) : %d+%d > %d *****\n", ai, m, sA->m);
if(aj+m > sA->n) printf("\n***** trsv_lnu_libstr : aj+m > col(A) : %d+%d > %d *****\n", aj, m, sA->n);
// x: m
if(xi+m > sx->m) printf("\n***** trsv_lnu_libstr : xi+m > size(x) : %d+%d > %d *****\n", xi, m, sx->m);
// z: m
if(zi+m > sz->m) printf("\n***** trsv_lnu_libstr : zi+m > size(z) : %d+%d > %d *****\n", zi, m, sz->m);
#endif
char cl = 'l';
char cn = 'n';
char cr = 'r';
char ct = 't';
char cu = 'u';
int i1 = 1;
REAL d1 = 1.0;
REAL dm1 = -1.0;
int lda = sA->m;
REAL *pA = sA->pA + ai + aj*lda;
REAL *x = sx->pa + xi;
REAL *z = sz->pa + zi;
COPY(&m, x, &i1, z, &i1);
TRSV(&cl, &cn, &cu, &m, pA, &lda, z, &i1);
return;
}
void TRSV_LTN_LIBSTR(int m, struct STRMAT *sA, int ai, int aj, struct STRVEC *sx, int xi, struct STRVEC *sz, int zi)
{
if(m==0)
return;
#if defined(DIM_CHECK)
// non-negative size
if(m<0) printf("\n****** trsv_ltn_libstr : m<0 : %d<0 *****\n", m);
// non-negative offset
if(ai<0) printf("\n****** trsv_ltn_libstr : ai<0 : %d<0 *****\n", ai);
if(aj<0) printf("\n****** trsv_ltn_libstr : aj<0 : %d<0 *****\n", aj);
if(xi<0) printf("\n****** trsv_ltn_libstr : xi<0 : %d<0 *****\n", xi);
if(zi<0) printf("\n****** trsv_ltn_libstr : zi<0 : %d<0 *****\n", zi);
// inside matrix
// A: m x k
if(ai+m > sA->m) printf("\n***** trsv_ltn_libstr : ai+m > row(A) : %d+%d > %d *****\n", ai, m, sA->m);
if(aj+m > sA->n) printf("\n***** trsv_ltn_libstr : aj+m > col(A) : %d+%d > %d *****\n", aj, m, sA->n);
// x: m
if(xi+m > sx->m) printf("\n***** trsv_ltn_libstr : xi+m > size(x) : %d+%d > %d *****\n", xi, m, sx->m);
// z: m
if(zi+m > sz->m) printf("\n***** trsv_ltn_libstr : zi+m > size(z) : %d+%d > %d *****\n", zi, m, sz->m);
#endif
char cl = 'l';
char cn = 'n';
char cr = 'r';
char ct = 't';
char cu = 'u';
int i1 = 1;
REAL d1 = 1.0;
REAL dm1 = -1.0;
int lda = sA->m;
REAL *pA = sA->pA + ai + aj*lda;
REAL *x = sx->pa + xi;
REAL *z = sz->pa + zi;
COPY(&m, x, &i1, z, &i1);
TRSV(&cl, &ct, &cn, &m, pA, &lda, z, &i1);
return;
}
void TRSV_LTU_LIBSTR(int m, struct STRMAT *sA, int ai, int aj, struct STRVEC *sx, int xi, struct STRVEC *sz, int zi)
{
if(m==0)
return;
#if defined(DIM_CHECK)
// non-negative size
if(m<0) printf("\n****** trsv_ltu_libstr : m<0 : %d<0 *****\n", m);
// non-negative offset
if(ai<0) printf("\n****** trsv_ltu_libstr : ai<0 : %d<0 *****\n", ai);
if(aj<0) printf("\n****** trsv_ltu_libstr : aj<0 : %d<0 *****\n", aj);
if(xi<0) printf("\n****** trsv_ltu_libstr : xi<0 : %d<0 *****\n", xi);
if(zi<0) printf("\n****** trsv_ltu_libstr : zi<0 : %d<0 *****\n", zi);
// inside matrix
// A: m x k
if(ai+m > sA->m) printf("\n***** trsv_ltu_libstr : ai+m > row(A) : %d+%d > %d *****\n", ai, m, sA->m);
if(aj+m > sA->n) printf("\n***** trsv_ltu_libstr : aj+m > col(A) : %d+%d > %d *****\n", aj, m, sA->n);
// x: m
if(xi+m > sx->m) printf("\n***** trsv_ltu_libstr : xi+m > size(x) : %d+%d > %d *****\n", xi, m, sx->m);
// z: m
if(zi+m > sz->m) printf("\n***** trsv_ltu_libstr : zi+m > size(z) : %d+%d > %d *****\n", zi, m, sz->m);
#endif
char cl = 'l';
char cn = 'n';
char cr = 'r';
char ct = 't';
char cu = 'u';
int i1 = 1;
REAL d1 = 1.0;
REAL dm1 = -1.0;
int lda = sA->m;
REAL *pA = sA->pA + ai + aj*lda;
REAL *x = sx->pa + xi;
REAL *z = sz->pa + zi;
COPY(&m, x, &i1, z, &i1);
TRSV(&cl, &ct, &cu, &m, pA, &lda, z, &i1);
return;
}
void TRSV_UNN_LIBSTR(int m, struct STRMAT *sA, int ai, int aj, struct STRVEC *sx, int xi, struct STRVEC *sz, int zi)
{
if(m==0)
return;
#if defined(DIM_CHECK)
// non-negative size
if(m<0) printf("\n****** trsv_unn_libstr : m<0 : %d<0 *****\n", m);
// non-negative offset
if(ai<0) printf("\n****** trsv_unn_libstr : ai<0 : %d<0 *****\n", ai);
if(aj<0) printf("\n****** trsv_unn_libstr : aj<0 : %d<0 *****\n", aj);
if(xi<0) printf("\n****** trsv_unn_libstr : xi<0 : %d<0 *****\n", xi);
if(zi<0) printf("\n****** trsv_unn_libstr : zi<0 : %d<0 *****\n", zi);
// inside matrix
// A: m x k
if(ai+m > sA->m) printf("\n***** trsv_unn_libstr : ai+m > row(A) : %d+%d > %d *****\n", ai, m, sA->m);
if(aj+m > sA->n) printf("\n***** trsv_unn_libstr : aj+m > col(A) : %d+%d > %d *****\n", aj, m, sA->n);
// x: m
if(xi+m > sx->m) printf("\n***** trsv_unn_libstr : xi+m > size(x) : %d+%d > %d *****\n", xi, m, sx->m);
// z: m
if(zi+m > sz->m) printf("\n***** trsv_unn_libstr : zi+m > size(z) : %d+%d > %d *****\n", zi, m, sz->m);
#endif
char cl = 'l';
char cn = 'n';
char cr = 'r';
char ct = 't';
char cu = 'u';
int i1 = 1;
REAL d1 = 1.0;
REAL dm1 = -1.0;
int lda = sA->m;
REAL *pA = sA->pA + ai + aj*lda;
REAL *x = sx->pa + xi;
REAL *z = sz->pa + zi;
COPY(&m, x, &i1, z, &i1);
TRSV(&cu, &cn, &cn, &m, pA, &lda, z, &i1);
return;
}
void TRSV_UTN_LIBSTR(int m, struct STRMAT *sA, int ai, int aj, struct STRVEC *sx, int xi, struct STRVEC *sz, int zi)
{
if(m==0)
return;
#if defined(DIM_CHECK)
// non-negative size
if(m<0) printf("\n****** trsv_utn_libstr : m<0 : %d<0 *****\n", m);
// non-negative offset
if(ai<0) printf("\n****** trsv_utn_libstr : ai<0 : %d<0 *****\n", ai);
if(aj<0) printf("\n****** trsv_utn_libstr : aj<0 : %d<0 *****\n", aj);
if(xi<0) printf("\n****** trsv_utn_libstr : xi<0 : %d<0 *****\n", xi);
if(zi<0) printf("\n****** trsv_utn_libstr : zi<0 : %d<0 *****\n", zi);
// inside matrix
// A: m x k
if(ai+m > sA->m) printf("\n***** trsv_utn_libstr : ai+m > row(A) : %d+%d > %d *****\n", ai, m, sA->m);
if(aj+m > sA->n) printf("\n***** trsv_utn_libstr : aj+m > col(A) : %d+%d > %d *****\n", aj, m, sA->n);
// x: m
if(xi+m > sx->m) printf("\n***** trsv_utn_libstr : xi+m > size(x) : %d+%d > %d *****\n", xi, m, sx->m);
// z: m
if(zi+m > sz->m) printf("\n***** trsv_utn_libstr : zi+m > size(z) : %d+%d > %d *****\n", zi, m, sz->m);
#endif
char cl = 'l';
char cn = 'n';
char cr = 'r';
char ct = 't';
char cu = 'u';
int i1 = 1;
REAL d1 = 1.0;
REAL dm1 = -1.0;
int lda = sA->m;
REAL *pA = sA->pA + ai + aj*lda;
REAL *x = sx->pa + xi;
REAL *z = sz->pa + zi;
COPY(&m, x, &i1, z, &i1);
TRSV(&cu, &ct, &cn, &m, pA, &lda, z, &i1);
return;
}
#else
#error : wrong LA choice
#endif