| /************************************************************************************************** |
| * * |
| * This file is part of BLASFEO. * |
| * * |
| * BLASFEO -- BLAS For Embedded Optimization. * |
| * Copyright (C) 2016-2017 by Gianluca Frison. * |
| * Developed at IMTEK (University of Freiburg) under the supervision of Moritz Diehl. * |
| * All rights reserved. * |
| * * |
| * HPMPC is free software; you can redistribute it and/or * |
| * modify it under the terms of the GNU Lesser General Public * |
| * License as published by the Free Software Foundation; either * |
| * version 2.1 of the License, or (at your option) any later version. * |
| * * |
| * HPMPC is distributed in the hope that it will be useful, * |
| * but WITHOUT ANY WARRANTY; without even the implied warranty of * |
| * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. * |
| * See the GNU Lesser General Public License for more details. * |
| * * |
| * You should have received a copy of the GNU Lesser General Public * |
| * License along with HPMPC; if not, write to the Free Software * |
| * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA * |
| * * |
| * Author: Gianluca Frison, giaf (at) dtu.dk * |
| * gianluca.frison (at) imtek.uni-freiburg.de * |
| * * |
| **************************************************************************************************/ |
| |
| |
| |
| #if defined(LA_REFERENCE) |
| |
| |
| |
| void GEMV_N_LIBSTR(int m, int n, REAL alpha, struct STRMAT *sA, int ai, int aj, struct STRVEC *sx, int xi, REAL beta, struct STRVEC *sy, int yi, struct STRVEC *sz, int zi) |
| { |
| int ii, jj; |
| REAL |
| y_0, y_1, y_2, y_3, |
| x_0, x_1; |
| int lda = sA->m; |
| REAL *pA = sA->pA + ai + aj*lda; |
| REAL *x = sx->pa + xi; |
| REAL *y = sy->pa + yi; |
| REAL *z = sz->pa + zi; |
| #if 1 // y reg version |
| ii = 0; |
| for(; ii<m-1; ii+=2) |
| { |
| y_0 = 0.0; |
| y_1 = 0.0; |
| jj = 0; |
| for(; jj<n-1; jj+=2) |
| { |
| y_0 += pA[ii+0+lda*(jj+0)] * x[jj+0] + pA[ii+0+lda*(jj+1)] * x[jj+1]; |
| y_1 += pA[ii+1+lda*(jj+0)] * x[jj+0] + pA[ii+1+lda*(jj+1)] * x[jj+1]; |
| } |
| if(jj<n) |
| { |
| y_0 += pA[ii+0+lda*jj] * x[jj]; |
| y_1 += pA[ii+1+lda*jj] * x[jj]; |
| } |
| z[ii+0] = beta * y[ii+0] + alpha * y_0; |
| z[ii+1] = beta * y[ii+1] + alpha * y_1; |
| } |
| for(; ii<m; ii++) |
| { |
| y_0 = 0.0; |
| for(jj=0; jj<n; jj++) |
| { |
| y_0 += pA[ii+lda*jj] * x[jj]; |
| } |
| z[ii] = beta * y[ii] + alpha * y_0; |
| } |
| #else // x reg version |
| for(ii=0; ii<n; ii++) |
| { |
| z[ii] = beta * y[ii]; |
| } |
| jj = 0; |
| for(; jj<n-1; jj+=2) |
| { |
| x_0 = alpha * x[jj+0]; |
| x_1 = alpha * x[jj+1]; |
| ii = 0; |
| for(; ii<m-1; ii+=2) |
| { |
| z[ii+0] += pA[ii+0+lda*(jj+0)] * x_0 + pA[ii+0+lda*(jj+1)] * x_1; |
| z[ii+1] += pA[ii+1+lda*(jj+0)] * x_0 + pA[ii+1+lda*(jj+1)] * x_1; |
| } |
| for(; ii<m; ii++) |
| { |
| z[ii] += pA[ii+lda*(jj+0)] * x_0; |
| z[ii] += pA[ii+lda*(jj+1)] * x_1; |
| } |
| } |
| for(; jj<n; jj++) |
| { |
| x_0 = alpha * x[jj+0]; |
| for(ii=0; ii<m; ii++) |
| { |
| z[ii] += pA[ii+lda*(jj+0)] * x_0; |
| } |
| } |
| #endif |
| return; |
| } |
| |
| |
| |
| void GEMV_T_LIBSTR(int m, int n, REAL alpha, struct STRMAT *sA, int ai, int aj, struct STRVEC *sx, int xi, REAL beta, struct STRVEC *sy, int yi, struct STRVEC *sz, int zi) |
| { |
| int ii, jj; |
| REAL |
| y_0, y_1; |
| int lda = sA->m; |
| REAL *pA = sA->pA + ai + aj*lda; |
| REAL *x = sx->pa + xi; |
| REAL *y = sy->pa + yi; |
| REAL *z = sz->pa + zi; |
| jj = 0; |
| for(; jj<n-1; jj+=2) |
| { |
| y_0 = 0.0; |
| y_1 = 0.0; |
| ii = 0; |
| for(; ii<m-1; ii+=2) |
| { |
| y_0 += pA[ii+0+lda*(jj+0)] * x[ii+0] + pA[ii+1+lda*(jj+0)] * x[ii+1]; |
| y_1 += pA[ii+0+lda*(jj+1)] * x[ii+0] + pA[ii+1+lda*(jj+1)] * x[ii+1]; |
| } |
| if(ii<m) |
| { |
| y_0 += pA[ii+lda*(jj+0)] * x[ii]; |
| y_1 += pA[ii+lda*(jj+1)] * x[ii]; |
| } |
| z[jj+0] = beta * y[jj+0] + alpha * y_0; |
| z[jj+1] = beta * y[jj+1] + alpha * y_1; |
| } |
| for(; jj<n; jj++) |
| { |
| y_0 = 0.0; |
| for(ii=0; ii<m; ii++) |
| { |
| y_0 += pA[ii+lda*(jj+0)] * x[ii]; |
| } |
| z[jj+0] = beta * y[jj+0] + alpha * y_0; |
| } |
| return; |
| } |
| |
| |
| |
| // TODO optimize !!!!! |
| void GEMV_NT_LIBSTR(int m, int n, REAL alpha_n, REAL alpha_t, struct STRMAT *sA, int ai, int aj, struct STRVEC *sx_n, int xi_n, struct STRVEC *sx_t, int xi_t, REAL beta_n, REAL beta_t, struct STRVEC *sy_n, int yi_n, struct STRVEC *sy_t, int yi_t, struct STRVEC *sz_n, int zi_n, struct STRVEC *sz_t, int zi_t) |
| { |
| int ii, jj; |
| REAL |
| a_00, |
| x_n_0, |
| y_t_0; |
| int lda = sA->m; |
| REAL *pA = sA->pA + ai + aj*lda; |
| REAL *x_n = sx_n->pa + xi_n; |
| REAL *x_t = sx_t->pa + xi_t; |
| REAL *y_n = sy_n->pa + yi_n; |
| REAL *y_t = sy_t->pa + yi_t; |
| REAL *z_n = sz_n->pa + zi_n; |
| REAL *z_t = sz_t->pa + zi_t; |
| for(ii=0; ii<m; ii++) |
| { |
| z_n[ii] = beta_n * y_n[ii]; |
| } |
| for(jj=0; jj<n; jj++) |
| { |
| y_t_0 = 0.0; |
| x_n_0 = alpha_n * x_n[jj]; |
| for(ii=0; ii<m; ii++) |
| { |
| a_00 = pA[ii+lda*jj]; |
| z_n[ii] += a_00 * x_n_0; |
| y_t_0 += a_00 * x_t[ii]; |
| } |
| z_t[jj] = beta_t * y_t[jj] + alpha_t * y_t_0; |
| } |
| return; |
| } |
| |
| |
| |
| // TODO optimize !!!!! |
| void SYMV_L_LIBSTR(int m, int n, REAL alpha, struct STRMAT *sA, int ai, int aj, struct STRVEC *sx, int xi, REAL beta, struct STRVEC *sy, int yi, struct STRVEC *sz, int zi) |
| { |
| int ii, jj; |
| REAL |
| y_0; |
| int lda = sA->m; |
| REAL *pA = sA->pA + ai + aj*lda; |
| REAL *x = sx->pa + xi; |
| REAL *y = sy->pa + yi; |
| REAL *z = sz->pa + zi; |
| for(ii=0; ii<n; ii++) |
| { |
| y_0 = 0.0; |
| jj = 0; |
| for(; jj<=ii; jj++) |
| { |
| y_0 += pA[ii+lda*jj] * x[jj]; |
| } |
| for( ; jj<m; jj++) |
| { |
| y_0 += pA[jj+lda*ii] * x[jj]; |
| } |
| z[ii] = beta * y[ii] + alpha * y_0; |
| } |
| return; |
| } |
| |
| |
| |
| void TRMV_LNN_LIBSTR(int m, int n, struct STRMAT *sA, int ai, int aj, struct STRVEC *sx, int xi, struct STRVEC *sz, int zi) |
| { |
| int ii, jj; |
| REAL |
| y_0, y_1; |
| int lda = sA->m; |
| REAL *pA = sA->pA + ai + aj*lda; |
| REAL *x = sx->pa + xi; |
| REAL *z = sz->pa + zi; |
| if(m-n>0) |
| { |
| GEMV_N_LIBSTR(m-n, n, 1.0, sA, ai+n, aj, sx, xi, 0.0, sz, zi+n, sz, zi+n); |
| } |
| if(n%2!=0) |
| { |
| ii = n-1; |
| y_0 = x[ii]; |
| y_0 *= pA[ii+lda*ii]; |
| for(jj=0; jj<ii; jj++) |
| { |
| y_0 += pA[ii+lda*jj] * x[jj]; |
| } |
| z[ii] = y_0; |
| n -= 1; |
| } |
| for(ii=n-2; ii>=0; ii-=2) |
| { |
| y_0 = x[ii+0]; |
| y_1 = x[ii+1]; |
| y_1 *= pA[ii+1+lda*(ii+1)]; |
| y_1 += pA[ii+1+lda*(ii+0)] * y_0; |
| y_0 *= pA[ii+0+lda*(ii+0)]; |
| jj = 0; |
| for(; jj<ii-1; jj+=2) |
| { |
| y_0 += pA[ii+0+lda*(jj+0)] * x[jj+0] + pA[ii+0+lda*(jj+1)] * x[jj+1]; |
| y_1 += pA[ii+1+lda*(jj+0)] * x[jj+0] + pA[ii+1+lda*(jj+1)] * x[jj+1]; |
| } |
| // XXX there is no clean up loop !!!!! |
| // for(; jj<ii; jj++) |
| // { |
| // y_0 += pA[ii+0+lda*jj] * x[jj]; |
| // y_1 += pA[ii+1+lda*jj] * x[jj]; |
| // } |
| z[ii+0] = y_0; |
| z[ii+1] = y_1; |
| } |
| return; |
| } |
| |
| |
| |
| void TRMV_LTN_LIBSTR(int m, int n, struct STRMAT *sA, int ai, int aj, struct STRVEC *sx, int xi, struct STRVEC *sz, int zi) |
| { |
| int ii, jj; |
| REAL |
| y_0, y_1; |
| int lda = sA->m; |
| REAL *pA = sA->pA + ai + aj*lda; |
| REAL *x = sx->pa + xi; |
| REAL *z = sz->pa + zi; |
| jj = 0; |
| for(; jj<n-1; jj+=2) |
| { |
| y_0 = x[jj+0]; |
| y_1 = x[jj+1]; |
| y_0 *= pA[jj+0+lda*(jj+0)]; |
| y_0 += pA[jj+1+lda*(jj+0)] * y_1; |
| y_1 *= pA[jj+1+lda*(jj+1)]; |
| ii = jj+2; |
| for(; ii<m-1; ii+=2) |
| { |
| y_0 += pA[ii+0+lda*(jj+0)] * x[ii+0] + pA[ii+1+lda*(jj+0)] * x[ii+1]; |
| y_1 += pA[ii+0+lda*(jj+1)] * x[ii+0] + pA[ii+1+lda*(jj+1)] * x[ii+1]; |
| } |
| for(; ii<m; ii++) |
| { |
| y_0 += pA[ii+lda*(jj+0)] * x[ii]; |
| y_1 += pA[ii+lda*(jj+1)] * x[ii]; |
| } |
| z[jj+0] = y_0; |
| z[jj+1] = y_1; |
| } |
| for(; jj<n; jj++) |
| { |
| y_0 = x[jj]; |
| y_0 *= pA[jj+lda*jj]; |
| for(ii=jj+1; ii<m; ii++) |
| { |
| y_0 += pA[ii+lda*jj] * x[ii]; |
| } |
| z[jj] = y_0; |
| } |
| return; |
| } |
| |
| |
| |
| void TRMV_UNN_LIBSTR(int m, struct STRMAT *sA, int ai, int aj, struct STRVEC *sx, int xi, struct STRVEC *sz, int zi) |
| { |
| int ii, jj; |
| REAL |
| y_0, y_1, |
| x_0, x_1; |
| int lda = sA->m; |
| REAL *pA = sA->pA + ai + aj*lda; |
| REAL *x = sx->pa + xi; |
| REAL *z = sz->pa + zi; |
| #if 1 // y reg version |
| jj = 0; |
| for(; jj<m-1; jj+=2) |
| { |
| y_0 = x[jj+0]; |
| y_1 = x[jj+1]; |
| y_0 = pA[jj+0+lda*(jj+0)] * y_0; |
| y_0 += pA[jj+0+lda*(jj+1)] * y_1; |
| y_1 = pA[jj+1+lda*(jj+1)] * y_1; |
| ii = jj+2; |
| for(; ii<m-1; ii+=2) |
| { |
| y_0 += pA[jj+0+lda*(ii+0)] * x[ii+0] + pA[jj+0+lda*(ii+1)] * x[ii+1]; |
| y_1 += pA[jj+1+lda*(ii+0)] * x[ii+0] + pA[jj+1+lda*(ii+1)] * x[ii+1]; |
| } |
| if(ii<m) |
| { |
| y_0 += pA[jj+0+lda*(ii+0)] * x[ii+0]; |
| y_1 += pA[jj+1+lda*(ii+0)] * x[ii+0]; |
| } |
| z[jj+0] = y_0; |
| z[jj+1] = y_1; |
| } |
| for(; jj<m; jj++) |
| { |
| y_0 = pA[jj+lda*jj] * x[jj]; |
| for(ii=jj+1; ii<m; ii++) |
| { |
| y_0 += pA[jj+lda*ii] * x[ii]; |
| } |
| z[jj] = y_0; |
| } |
| #else // x reg version |
| if(x != z) |
| { |
| for(ii=0; ii<m; ii++) |
| z[ii] = x[ii]; |
| } |
| jj = 0; |
| for(; jj<m-1; jj+=2) |
| { |
| x_0 = z[jj+0]; |
| x_1 = z[jj+1]; |
| ii = 0; |
| for(; ii<jj-1; ii+=2) |
| { |
| z[ii+0] += pA[ii+0+lda*(jj+0)] * x_0 + pA[ii+0+lda*(jj+1)] * x_1; |
| z[ii+1] += pA[ii+1+lda*(jj+0)] * x_0 + pA[ii+1+lda*(jj+1)] * x_1; |
| } |
| // XXX there is no clean-up loop, since jj+=2 !!!!! |
| // for(; ii<jj; ii++) |
| // { |
| // z[ii+0] += pA[ii+0+lda*(jj+0)] * x_0 + pA[ii+0+lda*(jj+1)] * x_1; |
| // } |
| x_0 *= pA[jj+0+lda*(jj+0)]; |
| x_0 += pA[jj+0+lda*(jj+1)] * x_1; |
| x_1 *= pA[jj+1+lda*(jj+1)]; |
| z[jj+0] = x_0; |
| z[jj+1] = x_1; |
| } |
| for(; jj<m; jj++) |
| { |
| x_0 = z[jj]; |
| for(ii=0; ii<jj; ii++) |
| { |
| z[ii] += pA[ii+lda*jj] * x_0; |
| } |
| x_0 *= pA[jj+lda*jj]; |
| z[jj] = x_0; |
| } |
| #endif |
| return; |
| } |
| |
| |
| |
| void TRMV_UTN_LIBSTR(int m, struct STRMAT *sA, int ai, int aj, struct STRVEC *sx, int xi, struct STRVEC *sz, int zi) |
| { |
| int ii, jj; |
| REAL |
| y_0, y_1; |
| int lda = sA->m; |
| REAL *pA = sA->pA + ai + aj*lda; |
| REAL *x = sx->pa + xi; |
| REAL *z = sz->pa + zi; |
| if(m%2!=0) |
| { |
| jj = m-1; |
| y_0 = pA[jj+lda*jj] * x[jj]; |
| for(ii=0; ii<jj; ii++) |
| { |
| y_0 += pA[ii+lda*jj] * x[ii]; |
| } |
| z[jj] = y_0; |
| m -= 1; // XXX |
| } |
| for(jj=m-2; jj>=0; jj-=2) |
| { |
| y_1 = pA[jj+1+lda*(jj+1)] * x[jj+1]; |
| y_1 += pA[jj+0+lda*(jj+1)] * x[jj+0]; |
| y_0 = pA[jj+0+lda*(jj+0)] * x[jj+0]; |
| for(ii=0; ii<jj-1; ii+=2) |
| { |
| y_0 += pA[ii+0+lda*(jj+0)] * x[ii+0] + pA[ii+1+lda*(jj+0)] * x[ii+1]; |
| y_1 += pA[ii+0+lda*(jj+1)] * x[ii+0] + pA[ii+1+lda*(jj+1)] * x[ii+1]; |
| } |
| // XXX there is no clean-up loop !!!!! |
| // if(ii<jj) |
| // { |
| // y_0 += pA[ii+lda*(jj+0)] * x[ii]; |
| // y_1 += pA[ii+lda*(jj+1)] * x[ii]; |
| // } |
| z[jj+0] = y_0; |
| z[jj+1] = y_1; |
| } |
| return; |
| } |
| |
| |
| |
| void TRSV_LNN_MN_LIBSTR(int m, int n, struct STRMAT *sA, int ai, int aj, struct STRVEC *sx, int xi, struct STRVEC *sz, int zi) |
| { |
| if(m==0 | n==0) |
| return; |
| #if defined(DIM_CHECK) |
| // non-negative size |
| if(m<0) printf("\n****** trsv_lnn_mn_libstr : m<0 : %d<0 *****\n", m); |
| if(n<0) printf("\n****** trsv_lnn_mn_libstr : n<0 : %d<0 *****\n", n); |
| // non-negative offset |
| if(ai<0) printf("\n****** trsv_lnn_mn_libstr : ai<0 : %d<0 *****\n", ai); |
| if(aj<0) printf("\n****** trsv_lnn_mn_libstr : aj<0 : %d<0 *****\n", aj); |
| if(xi<0) printf("\n****** trsv_lnn_mn_libstr : xi<0 : %d<0 *****\n", xi); |
| if(zi<0) printf("\n****** trsv_lnn_mn_libstr : zi<0 : %d<0 *****\n", zi); |
| // inside matrix |
| // A: m x k |
| if(ai+m > sA->m) printf("\n***** trsv_lnn_mn_libstr : ai+m > row(A) : %d+%d > %d *****\n", ai, m, sA->m); |
| if(aj+n > sA->n) printf("\n***** trsv_lnn_mn_libstr : aj+n > col(A) : %d+%d > %d *****\n", aj, n, sA->n); |
| // x: m |
| if(xi+m > sx->m) printf("\n***** trsv_lnn_mn_libstr : xi+m > size(x) : %d+%d > %d *****\n", xi, m, sx->m); |
| // z: m |
| if(zi+m > sz->m) printf("\n***** trsv_lnn_mn_libstr : zi+m > size(z) : %d+%d > %d *****\n", zi, m, sz->m); |
| #endif |
| int ii, jj, j1; |
| REAL |
| y_0, y_1, |
| x_0, x_1; |
| int lda = sA->m; |
| REAL *pA = sA->pA + ai + aj*lda; |
| REAL *dA = sA->dA; |
| REAL *x = sx->pa + xi; |
| REAL *z = sz->pa + zi; |
| if(ai==0 & aj==0) |
| { |
| if(sA->use_dA!=1) |
| { |
| for(ii=0; ii<n; ii++) |
| dA[ii] = 1.0 / pA[ii+lda*ii]; |
| sA->use_dA = 1; |
| } |
| } |
| else |
| { |
| for(ii=0; ii<n; ii++) |
| dA[ii] = 1.0 / pA[ii+lda*ii]; |
| sA->use_dA = 0; |
| } |
| #if 1 // y reg version |
| ii = 0; |
| for(; ii<n-1; ii+=2) |
| { |
| y_0 = x[ii+0]; |
| y_1 = x[ii+1]; |
| jj = 0; |
| for(; jj<ii-1; jj+=2) |
| { |
| y_0 -= pA[ii+0+lda*(jj+0)] * z[jj+0] + pA[ii+0+lda*(jj+1)] * z[jj+1]; |
| y_1 -= pA[ii+1+lda*(jj+0)] * z[jj+0] + pA[ii+1+lda*(jj+1)] * z[jj+1]; |
| } |
| // XXX there is no clean-up loop !!!!! |
| // if(jj<ii) |
| // { |
| // y_0 -= pA[ii+0+lda*(jj+0)] * z[jj+0]; |
| // y_1 -= pA[ii+1+lda*(jj+0)] * z[jj+0]; |
| // } |
| y_0 *= dA[ii+0]; |
| y_1 -= pA[ii+1+lda*(jj+0)] * y_0; |
| y_1 *= dA[ii+1]; |
| z[ii+0] = y_0; |
| z[ii+1] = y_1; |
| } |
| for(; ii<n; ii++) |
| { |
| y_0 = x[ii]; |
| for(jj=0; jj<ii; jj++) |
| { |
| y_0 -= pA[ii+lda*jj] * z[jj]; |
| } |
| y_0 *= dA[ii]; |
| z[ii] = y_0; |
| } |
| for(; ii<m-1; ii+=2) |
| { |
| y_0 = x[ii+0]; |
| y_1 = x[ii+1]; |
| jj = 0; |
| for(; jj<n-1; jj+=2) |
| { |
| y_0 -= pA[ii+0+lda*(jj+0)] * z[jj+0] + pA[ii+0+lda*(jj+1)] * z[jj+1]; |
| y_1 -= pA[ii+1+lda*(jj+0)] * z[jj+0] + pA[ii+1+lda*(jj+1)] * z[jj+1]; |
| } |
| if(jj<n) |
| { |
| y_0 -= pA[ii+0+lda*(jj+0)] * z[jj+0]; |
| y_1 -= pA[ii+1+lda*(jj+0)] * z[jj+0]; |
| } |
| z[ii+0] = y_0; |
| z[ii+1] = y_1; |
| } |
| for(; ii<m; ii++) |
| { |
| y_0 = x[ii]; |
| for(jj=0; jj<n; jj++) |
| { |
| y_0 -= pA[ii+lda*jj] * z[jj]; |
| } |
| z[ii] = y_0; |
| } |
| #else // x reg version |
| if(x != z) |
| { |
| for(ii=0; ii<m; ii++) |
| z[ii] = x[ii]; |
| } |
| jj = 0; |
| for(; jj<n-1; jj+=2) |
| { |
| x_0 = dA[jj+0] * z[jj+0]; |
| x_1 = z[jj+1] - pA[jj+1+lda*(jj+0)] * x_0; |
| x_1 = dA[jj+1] * x_1; |
| z[jj+0] = x_0; |
| z[jj+1] = x_1; |
| ii = jj+2; |
| for(; ii<m-1; ii+=2) |
| { |
| z[ii+0] -= pA[ii+0+lda*(jj+0)] * x_0 + pA[ii+0+lda*(jj+1)] * x_1; |
| z[ii+1] -= pA[ii+1+lda*(jj+0)] * x_0 + pA[ii+1+lda*(jj+1)] * x_1; |
| } |
| for(; ii<m; ii++) |
| { |
| z[ii] -= pA[ii+lda*(jj+0)] * x_0 + pA[ii+lda*(jj+1)] * x_1; |
| } |
| } |
| for(; jj<n; jj++) |
| { |
| x_0 = dA[jj] * z[jj]; |
| z[jj] = x_0; |
| for(ii=jj+1; ii<m; ii++) |
| { |
| z[ii] -= pA[ii+lda*jj] * x_0; |
| } |
| } |
| #endif |
| return; |
| } |
| |
| |
| |
| void TRSV_LTN_MN_LIBSTR(int m, int n, struct STRMAT *sA, int ai, int aj, struct STRVEC *sx, int xi, struct STRVEC *sz, int zi) |
| { |
| if(m==0) |
| return; |
| #if defined(DIM_CHECK) |
| // non-negative size |
| if(m<0) printf("\n****** trsv_ltn_mn_libstr : m<0 : %d<0 *****\n", m); |
| if(n<0) printf("\n****** trsv_ltn_mn_libstr : n<0 : %d<0 *****\n", n); |
| // non-negative offset |
| if(ai<0) printf("\n****** trsv_ltn_mn_libstr : ai<0 : %d<0 *****\n", ai); |
| if(aj<0) printf("\n****** trsv_ltn_mn_libstr : aj<0 : %d<0 *****\n", aj); |
| if(xi<0) printf("\n****** trsv_ltn_mn_libstr : xi<0 : %d<0 *****\n", xi); |
| if(zi<0) printf("\n****** trsv_ltn_mn_libstr : zi<0 : %d<0 *****\n", zi); |
| // inside matrix |
| // A: m x k |
| if(ai+m > sA->m) printf("\n***** trsv_ltn_mn_libstr : ai+m > row(A) : %d+%d > %d *****\n", ai, m, sA->m); |
| if(aj+n > sA->n) printf("\n***** trsv_ltn_mn_libstr : aj+n > col(A) : %d+%d > %d *****\n", aj, n, sA->n); |
| // x: m |
| if(xi+m > sx->m) printf("\n***** trsv_ltn_mn_libstr : xi+m > size(x) : %d+%d > %d *****\n", xi, m, sx->m); |
| // z: m |
| if(zi+m > sz->m) printf("\n***** trsv_ltn_mn_libstr : zi+m > size(z) : %d+%d > %d *****\n", zi, m, sz->m); |
| #endif |
| int ii, jj; |
| REAL |
| y_0, y_1; |
| int lda = sA->m; |
| REAL *pA = sA->pA + ai + aj*lda; |
| REAL *dA = sA->dA; |
| REAL *x = sx->pa + xi; |
| REAL *z = sz->pa + zi; |
| if(ai==0 & aj==0) |
| { |
| if(sA->use_dA!=1) |
| { |
| for(ii=0; ii<n; ii++) |
| dA[ii] = 1.0 / pA[ii+lda*ii]; |
| sA->use_dA = 1; |
| } |
| } |
| else |
| { |
| for(ii=0; ii<n; ii++) |
| dA[ii] = 1.0 / pA[ii+lda*ii]; |
| sA->use_dA = 0; |
| } |
| if(n%2!=0) |
| { |
| jj = n-1; |
| y_0 = x[jj]; |
| for(ii=jj+1; ii<m; ii++) |
| { |
| y_0 -= pA[ii+lda*jj] * z[ii]; |
| } |
| y_0 *= dA[jj]; |
| z[jj] = y_0; |
| jj -= 2; |
| } |
| else |
| { |
| jj = n-2; |
| } |
| for(; jj>=0; jj-=2) |
| { |
| y_0 = x[jj+0]; |
| y_1 = x[jj+1]; |
| ii = jj+2; |
| for(; ii<m-1; ii+=2) |
| { |
| y_0 -= pA[ii+0+lda*(jj+0)] * z[ii+0] + pA[ii+1+lda*(jj+0)] * z[ii+1]; |
| y_1 -= pA[ii+0+lda*(jj+1)] * z[ii+0] + pA[ii+1+lda*(jj+1)] * z[ii+1]; |
| } |
| if(ii<m) |
| { |
| y_0 -= pA[ii+lda*(jj+0)] * z[ii]; |
| y_1 -= pA[ii+lda*(jj+1)] * z[ii]; |
| } |
| y_1 *= dA[jj+1]; |
| y_0 -= pA[jj+1+lda*(jj+0)] * y_1; |
| y_0 *= dA[jj+0]; |
| z[jj+0] = y_0; |
| z[jj+1] = y_1; |
| } |
| return; |
| } |
| |
| |
| |
| void TRSV_LNN_LIBSTR(int m, struct STRMAT *sA, int ai, int aj, struct STRVEC *sx, int xi, struct STRVEC *sz, int zi) |
| { |
| if(m==0) |
| return; |
| #if defined(DIM_CHECK) |
| // non-negative size |
| if(m<0) printf("\n****** trsv_lnn_libstr : m<0 : %d<0 *****\n", m); |
| // non-negative offset |
| if(ai<0) printf("\n****** trsv_lnn_libstr : ai<0 : %d<0 *****\n", ai); |
| if(aj<0) printf("\n****** trsv_lnn_libstr : aj<0 : %d<0 *****\n", aj); |
| if(xi<0) printf("\n****** trsv_lnn_libstr : xi<0 : %d<0 *****\n", xi); |
| if(zi<0) printf("\n****** trsv_lnn_libstr : zi<0 : %d<0 *****\n", zi); |
| // inside matrix |
| // A: m x k |
| if(ai+m > sA->m) printf("\n***** trsv_lnn_libstr : ai+m > row(A) : %d+%d > %d *****\n", ai, m, sA->m); |
| if(aj+m > sA->n) printf("\n***** trsv_lnn_libstr : aj+m > col(A) : %d+%d > %d *****\n", aj, m, sA->n); |
| // x: m |
| if(xi+m > sx->m) printf("\n***** trsv_lnn_libstr : xi+m > size(x) : %d+%d > %d *****\n", xi, m, sx->m); |
| // z: m |
| if(zi+m > sz->m) printf("\n***** trsv_lnn_libstr : zi+m > size(z) : %d+%d > %d *****\n", zi, m, sz->m); |
| #endif |
| int ii, jj, j1; |
| REAL |
| y_0, y_1, |
| x_0, x_1; |
| int lda = sA->m; |
| REAL *pA = sA->pA + ai + aj*lda; |
| REAL *dA = sA->dA; |
| REAL *x = sx->pa + xi; |
| REAL *z = sz->pa + zi; |
| if(ai==0 & aj==0) |
| { |
| if(sA->use_dA!=1) |
| { |
| for(ii=0; ii<m; ii++) |
| dA[ii] = 1.0 / pA[ii+lda*ii]; |
| sA->use_dA = 1; |
| } |
| } |
| else |
| { |
| for(ii=0; ii<m; ii++) |
| dA[ii] = 1.0 / pA[ii+lda*ii]; |
| sA->use_dA = 0; |
| } |
| ii = 0; |
| for(; ii<m-1; ii+=2) |
| { |
| y_0 = x[ii+0]; |
| y_1 = x[ii+1]; |
| jj = 0; |
| for(; jj<ii-1; jj+=2) |
| { |
| y_0 -= pA[ii+0+lda*(jj+0)] * z[jj+0] + pA[ii+0+lda*(jj+1)] * z[jj+1]; |
| y_1 -= pA[ii+1+lda*(jj+0)] * z[jj+0] + pA[ii+1+lda*(jj+1)] * z[jj+1]; |
| } |
| y_0 *= dA[ii+0]; |
| y_1 -= pA[ii+1+lda*(jj+0)] * y_0; |
| y_1 *= dA[ii+1]; |
| z[ii+0] = y_0; |
| z[ii+1] = y_1; |
| } |
| for(; ii<m; ii++) |
| { |
| y_0 = x[ii]; |
| for(jj=0; jj<ii; jj++) |
| { |
| y_0 -= pA[ii+lda*jj] * z[jj]; |
| } |
| y_0 *= dA[ii]; |
| z[ii] = y_0; |
| } |
| return; |
| } |
| |
| |
| |
| void TRSV_LNU_LIBSTR(int m, struct STRMAT *sA, int ai, int aj, struct STRVEC *sx, int xi, struct STRVEC *sz, int zi) |
| { |
| if(m==0) |
| return; |
| #if defined(DIM_CHECK) |
| // non-negative size |
| if(m<0) printf("\n****** trsv_lnu_libstr : m<0 : %d<0 *****\n", m); |
| // non-negative offset |
| if(ai<0) printf("\n****** trsv_lnu_libstr : ai<0 : %d<0 *****\n", ai); |
| if(aj<0) printf("\n****** trsv_lnu_libstr : aj<0 : %d<0 *****\n", aj); |
| if(xi<0) printf("\n****** trsv_lnu_libstr : xi<0 : %d<0 *****\n", xi); |
| if(zi<0) printf("\n****** trsv_lnu_libstr : zi<0 : %d<0 *****\n", zi); |
| // inside matrix |
| // A: m x k |
| if(ai+m > sA->m) printf("\n***** trsv_lnu_libstr : ai+m > row(A) : %d+%d > %d *****\n", ai, m, sA->m); |
| if(aj+m > sA->n) printf("\n***** trsv_lnu_libstr : aj+m > col(A) : %d+%d > %d *****\n", aj, m, sA->n); |
| // x: m |
| if(xi+m > sx->m) printf("\n***** trsv_lnu_libstr : xi+m > size(x) : %d+%d > %d *****\n", xi, m, sx->m); |
| // z: m |
| if(zi+m > sz->m) printf("\n***** trsv_lnu_libstr : zi+m > size(z) : %d+%d > %d *****\n", zi, m, sz->m); |
| #endif |
| printf("\n***** trsv_lnu_libstr : feature not implemented yet *****\n"); |
| exit(1); |
| } |
| |
| |
| |
| void TRSV_LTN_LIBSTR(int m, struct STRMAT *sA, int ai, int aj, struct STRVEC *sx, int xi, struct STRVEC *sz, int zi) |
| { |
| if(m==0) |
| return; |
| #if defined(DIM_CHECK) |
| // non-negative size |
| if(m<0) printf("\n****** trsv_ltn_libstr : m<0 : %d<0 *****\n", m); |
| // non-negative offset |
| if(ai<0) printf("\n****** trsv_ltn_libstr : ai<0 : %d<0 *****\n", ai); |
| if(aj<0) printf("\n****** trsv_ltn_libstr : aj<0 : %d<0 *****\n", aj); |
| if(xi<0) printf("\n****** trsv_ltn_libstr : xi<0 : %d<0 *****\n", xi); |
| if(zi<0) printf("\n****** trsv_ltn_libstr : zi<0 : %d<0 *****\n", zi); |
| // inside matrix |
| // A: m x k |
| if(ai+m > sA->m) printf("\n***** trsv_ltn_libstr : ai+m > row(A) : %d+%d > %d *****\n", ai, m, sA->m); |
| if(aj+m > sA->n) printf("\n***** trsv_ltn_libstr : aj+m > col(A) : %d+%d > %d *****\n", aj, m, sA->n); |
| // x: m |
| if(xi+m > sx->m) printf("\n***** trsv_ltn_libstr : xi+m > size(x) : %d+%d > %d *****\n", xi, m, sx->m); |
| // z: m |
| if(zi+m > sz->m) printf("\n***** trsv_ltn_libstr : zi+m > size(z) : %d+%d > %d *****\n", zi, m, sz->m); |
| #endif |
| int ii, jj; |
| REAL |
| y_0, y_1; |
| int lda = sA->m; |
| REAL *pA = sA->pA + ai + aj*lda; |
| REAL *dA = sA->dA; |
| REAL *x = sx->pa + xi; |
| REAL *z = sz->pa + zi; |
| if(ai==0 & aj==0) |
| { |
| if(sA->use_dA!=1) |
| { |
| for(ii=0; ii<m; ii++) |
| dA[ii] = 1.0 / pA[ii+lda*ii]; |
| sA->use_dA = 1; |
| } |
| } |
| else |
| { |
| for(ii=0; ii<m; ii++) |
| dA[ii] = 1.0 / pA[ii+lda*ii]; |
| sA->use_dA = 0; |
| } |
| if(m%2!=0) |
| { |
| jj = m-1; |
| y_0 = x[jj]; |
| y_0 *= dA[jj]; |
| z[jj] = y_0; |
| jj -= 2; |
| } |
| else |
| { |
| jj = m-2; |
| } |
| for(; jj>=0; jj-=2) |
| { |
| y_0 = x[jj+0]; |
| y_1 = x[jj+1]; |
| ii = jj+2; |
| for(; ii<m-1; ii+=2) |
| { |
| y_0 -= pA[ii+0+lda*(jj+0)] * z[ii+0] + pA[ii+1+lda*(jj+0)] * z[ii+1]; |
| y_1 -= pA[ii+0+lda*(jj+1)] * z[ii+0] + pA[ii+1+lda*(jj+1)] * z[ii+1]; |
| } |
| if(ii<m) |
| { |
| y_0 -= pA[ii+lda*(jj+0)] * z[ii]; |
| y_1 -= pA[ii+lda*(jj+1)] * z[ii]; |
| } |
| y_1 *= dA[jj+1]; |
| y_0 -= pA[jj+1+lda*(jj+0)] * y_1; |
| y_0 *= dA[jj+0]; |
| z[jj+0] = y_0; |
| z[jj+1] = y_1; |
| } |
| return; |
| } |
| |
| |
| |
| void TRSV_LTU_LIBSTR(int m, struct STRMAT *sA, int ai, int aj, struct STRVEC *sx, int xi, struct STRVEC *sz, int zi) |
| { |
| if(m==0) |
| return; |
| #if defined(DIM_CHECK) |
| // non-negative size |
| if(m<0) printf("\n****** trsv_ltu_libstr : m<0 : %d<0 *****\n", m); |
| // non-negative offset |
| if(ai<0) printf("\n****** trsv_ltu_libstr : ai<0 : %d<0 *****\n", ai); |
| if(aj<0) printf("\n****** trsv_ltu_libstr : aj<0 : %d<0 *****\n", aj); |
| if(xi<0) printf("\n****** trsv_ltu_libstr : xi<0 : %d<0 *****\n", xi); |
| if(zi<0) printf("\n****** trsv_ltu_libstr : zi<0 : %d<0 *****\n", zi); |
| // inside matrix |
| // A: m x k |
| if(ai+m > sA->m) printf("\n***** trsv_ltu_libstr : ai+m > row(A) : %d+%d > %d *****\n", ai, m, sA->m); |
| if(aj+m > sA->n) printf("\n***** trsv_ltu_libstr : aj+m > col(A) : %d+%d > %d *****\n", aj, m, sA->n); |
| // x: m |
| if(xi+m > sx->m) printf("\n***** trsv_ltu_libstr : xi+m > size(x) : %d+%d > %d *****\n", xi, m, sx->m); |
| // z: m |
| if(zi+m > sz->m) printf("\n***** trsv_ltu_libstr : zi+m > size(z) : %d+%d > %d *****\n", zi, m, sz->m); |
| #endif |
| printf("\n***** trsv_ltu_libstr : feature not implemented yet *****\n"); |
| exit(1); |
| } |
| |
| |
| |
| void TRSV_UNN_LIBSTR(int m, struct STRMAT *sA, int ai, int aj, struct STRVEC *sx, int xi, struct STRVEC *sz, int zi) |
| { |
| if(m==0) |
| return; |
| #if defined(DIM_CHECK) |
| // non-negative size |
| if(m<0) printf("\n****** trsv_unn_libstr : m<0 : %d<0 *****\n", m); |
| // non-negative offset |
| if(ai<0) printf("\n****** trsv_unn_libstr : ai<0 : %d<0 *****\n", ai); |
| if(aj<0) printf("\n****** trsv_unn_libstr : aj<0 : %d<0 *****\n", aj); |
| if(xi<0) printf("\n****** trsv_unn_libstr : xi<0 : %d<0 *****\n", xi); |
| if(zi<0) printf("\n****** trsv_unn_libstr : zi<0 : %d<0 *****\n", zi); |
| // inside matrix |
| // A: m x k |
| if(ai+m > sA->m) printf("\n***** trsv_unn_libstr : ai+m > row(A) : %d+%d > %d *****\n", ai, m, sA->m); |
| if(aj+m > sA->n) printf("\n***** trsv_unn_libstr : aj+m > col(A) : %d+%d > %d *****\n", aj, m, sA->n); |
| // x: m |
| if(xi+m > sx->m) printf("\n***** trsv_unn_libstr : xi+m > size(x) : %d+%d > %d *****\n", xi, m, sx->m); |
| // z: m |
| if(zi+m > sz->m) printf("\n***** trsv_unn_libstr : zi+m > size(z) : %d+%d > %d *****\n", zi, m, sz->m); |
| #endif |
| printf("\n***** trsv_unn_libstr : feature not implemented yet *****\n"); |
| exit(1); |
| } |
| |
| |
| |
| void TRSV_UTN_LIBSTR(int m, struct STRMAT *sA, int ai, int aj, struct STRVEC *sx, int xi, struct STRVEC *sz, int zi) |
| { |
| if(m==0) |
| return; |
| #if defined(DIM_CHECK) |
| // non-negative size |
| if(m<0) printf("\n****** trsv_utn_libstr : m<0 : %d<0 *****\n", m); |
| // non-negative offset |
| if(ai<0) printf("\n****** trsv_utn_libstr : ai<0 : %d<0 *****\n", ai); |
| if(aj<0) printf("\n****** trsv_utn_libstr : aj<0 : %d<0 *****\n", aj); |
| if(xi<0) printf("\n****** trsv_utn_libstr : xi<0 : %d<0 *****\n", xi); |
| if(zi<0) printf("\n****** trsv_utn_libstr : zi<0 : %d<0 *****\n", zi); |
| // inside matrix |
| // A: m x k |
| if(ai+m > sA->m) printf("\n***** trsv_utn_libstr : ai+m > row(A) : %d+%d > %d *****\n", ai, m, sA->m); |
| if(aj+m > sA->n) printf("\n***** trsv_utn_libstr : aj+m > col(A) : %d+%d > %d *****\n", aj, m, sA->n); |
| // x: m |
| if(xi+m > sx->m) printf("\n***** trsv_utn_libstr : xi+m > size(x) : %d+%d > %d *****\n", xi, m, sx->m); |
| // z: m |
| if(zi+m > sz->m) printf("\n***** trsv_utn_libstr : zi+m > size(z) : %d+%d > %d *****\n", zi, m, sz->m); |
| #endif |
| printf("\n***** trsv_utn_libstr : feature not implemented yet *****\n"); |
| exit(1); |
| } |
| |
| |
| |
| #elif defined(LA_BLAS) |
| |
| |
| |
| void GEMV_N_LIBSTR(int m, int n, REAL alpha, struct STRMAT *sA, int ai, int aj, struct STRVEC *sx, int xi, REAL beta, struct STRVEC *sy, int yi, struct STRVEC *sz, int zi) |
| { |
| char cl = 'l'; |
| char cn = 'n'; |
| char cr = 'r'; |
| char ct = 't'; |
| char cu = 'u'; |
| int i1 = 1; |
| int lda = sA->m; |
| REAL *pA = sA->pA + ai + aj*lda; |
| REAL *x = sx->pa + xi; |
| REAL *y = sy->pa + yi; |
| REAL *z = sz->pa + zi; |
| COPY(&m, y, &i1, z, &i1); |
| GEMV(&cn, &m, &n, &alpha, pA, &lda, x, &i1, &beta, z, &i1); |
| return; |
| } |
| |
| |
| |
| void GEMV_T_LIBSTR(int m, int n, REAL alpha, struct STRMAT *sA, int ai, int aj, struct STRVEC *sx, int xi, REAL beta, struct STRVEC *sy, int yi, struct STRVEC *sz, int zi) |
| { |
| char cl = 'l'; |
| char cn = 'n'; |
| char cr = 'r'; |
| char ct = 't'; |
| char cu = 'u'; |
| int i1 = 1; |
| int lda = sA->m; |
| REAL *pA = sA->pA + ai + aj*lda; |
| REAL *x = sx->pa + xi; |
| REAL *y = sy->pa + yi; |
| REAL *z = sz->pa + zi; |
| COPY(&n, y, &i1, z, &i1); |
| GEMV(&ct, &m, &n, &alpha, pA, &lda, x, &i1, &beta, z, &i1); |
| return; |
| } |
| |
| |
| |
| void GEMV_NT_LIBSTR(int m, int n, REAL alpha_n, REAL alpha_t, struct STRMAT *sA, int ai, int aj, struct STRVEC *sx_n, int xi_n, struct STRVEC *sx_t, int xi_t, REAL beta_n, REAL beta_t, struct STRVEC *sy_n, int yi_n, struct STRVEC *sy_t, int yi_t, struct STRVEC *sz_n, int zi_n, struct STRVEC *sz_t, int zi_t) |
| { |
| char cl = 'l'; |
| char cn = 'n'; |
| char cr = 'r'; |
| char ct = 't'; |
| char cu = 'u'; |
| int i1 = 1; |
| int lda = sA->m; |
| REAL *pA = sA->pA + ai + aj*lda; |
| REAL *x_n = sx_n->pa + xi_n; |
| REAL *x_t = sx_t->pa + xi_t; |
| REAL *y_n = sy_n->pa + yi_n; |
| REAL *y_t = sy_t->pa + yi_t; |
| REAL *z_n = sz_n->pa + zi_n; |
| REAL *z_t = sz_t->pa + zi_t; |
| COPY(&m, y_n, &i1, z_n, &i1); |
| GEMV(&cn, &m, &n, &alpha_n, pA, &lda, x_n, &i1, &beta_n, z_n, &i1); |
| COPY(&n, y_t, &i1, z_t, &i1); |
| GEMV(&ct, &m, &n, &alpha_t, pA, &lda, x_t, &i1, &beta_t, z_t, &i1); |
| return; |
| } |
| |
| |
| |
| void SYMV_L_LIBSTR(int m, int n, REAL alpha, struct STRMAT *sA, int ai, int aj, struct STRVEC *sx, int xi, REAL beta, struct STRVEC *sy, int yi, struct STRVEC *sz, int zi) |
| { |
| char cl = 'l'; |
| char cn = 'n'; |
| char cr = 'r'; |
| char ct = 't'; |
| char cu = 'u'; |
| int i1 = 1; |
| REAL d1 = 1.0; |
| int lda = sA->m; |
| REAL *pA = sA->pA + ai + aj*lda; |
| REAL *x = sx->pa + xi; |
| REAL *y = sy->pa + yi; |
| REAL *z = sz->pa + zi; |
| int tmp = m-n; |
| COPY(&m, y, &i1, z, &i1); |
| SYMV(&cl, &n, &alpha, pA, &lda, x, &i1, &beta, z, &i1); |
| GEMV(&cn, &tmp, &n, &alpha, pA+n, &lda, x, &i1, &beta, z+n, &i1); |
| GEMV(&ct, &tmp, &n, &alpha, pA+n, &lda, x+n, &i1, &d1, z, &i1); |
| return; |
| } |
| |
| |
| |
| void TRMV_LNN_LIBSTR(int m, int n, struct STRMAT *sA, int ai, int aj, struct STRVEC *sx, int xi, struct STRVEC *sz, int zi) |
| { |
| char cl = 'l'; |
| char cn = 'n'; |
| char cr = 'r'; |
| char ct = 't'; |
| char cu = 'u'; |
| int i1 = 1; |
| REAL d1 = 1.0; |
| REAL d0 = 0.0; |
| REAL dm1 = -1.0; |
| int lda = sA->m; |
| REAL *pA = sA->pA + ai + aj*lda; |
| REAL *x = sx->pa + xi; |
| REAL *z = sz->pa + zi; |
| int tmp = m-n; |
| if(x!=z) |
| COPY(&n, x, &i1, z, &i1); |
| GEMV(&cn, &tmp, &n, &d1, pA+n, &lda, x, &i1, &d0, z+n, &i1); |
| TRMV(&cl, &cn, &cn, &n, pA, &lda, z, &i1); |
| return; |
| } |
| |
| |
| |
| void TRMV_LTN_LIBSTR(int m, int n, struct STRMAT *sA, int ai, int aj, struct STRVEC *sx, int xi, struct STRVEC *sz, int zi) |
| { |
| char cl = 'l'; |
| char cn = 'n'; |
| char cr = 'r'; |
| char ct = 't'; |
| char cu = 'u'; |
| int i1 = 1; |
| REAL d1 = 1.0; |
| REAL dm1 = -1.0; |
| int lda = sA->m; |
| REAL *pA = sA->pA + ai + aj*lda; |
| REAL *x = sx->pa + xi; |
| REAL *z = sz->pa + zi; |
| int tmp = m-n; |
| if(x!=z) |
| COPY(&n, x, &i1, z, &i1); |
| TRMV(&cl, &ct, &cn, &n, pA, &lda, z, &i1); |
| GEMV(&ct, &tmp, &n, &d1, pA+n, &lda, x+n, &i1, &d1, z, &i1); |
| return; |
| } |
| |
| |
| |
| void TRMV_UNN_LIBSTR(int m, struct STRMAT *sA, int ai, int aj, struct STRVEC *sx, int xi, struct STRVEC *sz, int zi) |
| { |
| char cl = 'l'; |
| char cn = 'n'; |
| char cr = 'r'; |
| char ct = 't'; |
| char cu = 'u'; |
| int i1 = 1; |
| REAL d1 = 1.0; |
| REAL dm1 = -1.0; |
| int lda = sA->m; |
| REAL *pA = sA->pA + ai + aj*lda; |
| REAL *x = sx->pa + xi; |
| REAL *z = sz->pa + zi; |
| COPY(&m, x, &i1, z, &i1); |
| TRMV(&cu, &cn, &cn, &m, pA, &lda, z, &i1); |
| return; |
| } |
| |
| |
| |
| void TRMV_UTN_LIBSTR(int m, struct STRMAT *sA, int ai, int aj, struct STRVEC *sx, int xi, struct STRVEC *sz, int zi) |
| { |
| char cl = 'l'; |
| char cn = 'n'; |
| char cr = 'r'; |
| char ct = 't'; |
| char cu = 'u'; |
| int i1 = 1; |
| REAL d1 = 1.0; |
| REAL dm1 = -1.0; |
| int lda = sA->m; |
| REAL *pA = sA->pA + ai + aj*lda; |
| REAL *x = sx->pa + xi; |
| REAL *z = sz->pa + zi; |
| COPY(&m, x, &i1, z, &i1); |
| TRMV(&cu, &ct, &cn, &m, pA, &lda, z, &i1); |
| return; |
| } |
| |
| |
| |
| void TRSV_LNN_MN_LIBSTR(int m, int n, struct STRMAT *sA, int ai, int aj, struct STRVEC *sx, int xi, struct STRVEC *sz, int zi) |
| { |
| if(m==0 | n==0) |
| return; |
| #if defined(DIM_CHECK) |
| // non-negative size |
| if(m<0) printf("\n****** trsv_lnn_mn_libstr : m<0 : %d<0 *****\n", m); |
| if(n<0) printf("\n****** trsv_lnn_mn_libstr : n<0 : %d<0 *****\n", n); |
| // non-negative offset |
| if(ai<0) printf("\n****** trsv_lnn_mn_libstr : ai<0 : %d<0 *****\n", ai); |
| if(aj<0) printf("\n****** trsv_lnn_mn_libstr : aj<0 : %d<0 *****\n", aj); |
| if(xi<0) printf("\n****** trsv_lnn_mn_libstr : xi<0 : %d<0 *****\n", xi); |
| if(zi<0) printf("\n****** trsv_lnn_mn_libstr : zi<0 : %d<0 *****\n", zi); |
| // inside matrix |
| // A: m x k |
| if(ai+m > sA->m) printf("\n***** trsv_lnn_mn_libstr : ai+m > row(A) : %d+%d > %d *****\n", ai, m, sA->m); |
| if(aj+n > sA->n) printf("\n***** trsv_lnn_mn_libstr : aj+n > col(A) : %d+%d > %d *****\n", aj, n, sA->n); |
| // x: m |
| if(xi+m > sx->m) printf("\n***** trsv_lnn_mn_libstr : xi+m > size(x) : %d+%d > %d *****\n", xi, m, sx->m); |
| // z: m |
| if(zi+m > sz->m) printf("\n***** trsv_lnn_mn_libstr : zi+m > size(z) : %d+%d > %d *****\n", zi, m, sz->m); |
| #endif |
| char cl = 'l'; |
| char cn = 'n'; |
| char cr = 'r'; |
| char ct = 't'; |
| char cu = 'u'; |
| int i1 = 1; |
| REAL d1 = 1.0; |
| REAL dm1 = -1.0; |
| int mmn = m-n; |
| int lda = sA->m; |
| REAL *pA = sA->pA + ai + aj*lda; |
| REAL *x = sx->pa + xi; |
| REAL *z = sz->pa + zi; |
| COPY(&m, x, &i1, z, &i1); |
| TRSV(&cl, &cn, &cn, &n, pA, &lda, z, &i1); |
| GEMV(&cn, &mmn, &n, &dm1, pA+n, &lda, z, &i1, &d1, z+n, &i1); |
| return; |
| } |
| |
| |
| |
| void TRSV_LTN_MN_LIBSTR(int m, int n, struct STRMAT *sA, int ai, int aj, struct STRVEC *sx, int xi, struct STRVEC *sz, int zi) |
| { |
| if(m==0) |
| return; |
| #if defined(DIM_CHECK) |
| // non-negative size |
| if(m<0) printf("\n****** trsv_ltn_mn_libstr : m<0 : %d<0 *****\n", m); |
| if(n<0) printf("\n****** trsv_ltn_mn_libstr : n<0 : %d<0 *****\n", n); |
| // non-negative offset |
| if(ai<0) printf("\n****** trsv_ltn_mn_libstr : ai<0 : %d<0 *****\n", ai); |
| if(aj<0) printf("\n****** trsv_ltn_mn_libstr : aj<0 : %d<0 *****\n", aj); |
| if(xi<0) printf("\n****** trsv_ltn_mn_libstr : xi<0 : %d<0 *****\n", xi); |
| if(zi<0) printf("\n****** trsv_ltn_mn_libstr : zi<0 : %d<0 *****\n", zi); |
| // inside matrix |
| // A: m x k |
| if(ai+m > sA->m) printf("\n***** trsv_ltn_mn_libstr : ai+m > row(A) : %d+%d > %d *****\n", ai, m, sA->m); |
| if(aj+n > sA->n) printf("\n***** trsv_ltn_mn_libstr : aj+n > col(A) : %d+%d > %d *****\n", aj, n, sA->n); |
| // x: m |
| if(xi+m > sx->m) printf("\n***** trsv_ltn_mn_libstr : xi+m > size(x) : %d+%d > %d *****\n", xi, m, sx->m); |
| // z: m |
| if(zi+m > sz->m) printf("\n***** trsv_ltn_mn_libstr : zi+m > size(z) : %d+%d > %d *****\n", zi, m, sz->m); |
| #endif |
| char cl = 'l'; |
| char cn = 'n'; |
| char cr = 'r'; |
| char ct = 't'; |
| char cu = 'u'; |
| int i1 = 1; |
| REAL d1 = 1.0; |
| REAL dm1 = -1.0; |
| int mmn = m-n; |
| int lda = sA->m; |
| REAL *pA = sA->pA + ai + aj*lda; |
| REAL *x = sx->pa + xi; |
| REAL *z = sz->pa + zi; |
| COPY(&m, x, &i1, z, &i1); |
| GEMV(&ct, &mmn, &n, &dm1, pA+n, &lda, z+n, &i1, &d1, z, &i1); |
| TRSV(&cl, &ct, &cn, &n, pA, &lda, z, &i1); |
| return; |
| } |
| |
| |
| |
| void TRSV_LNN_LIBSTR(int m, struct STRMAT *sA, int ai, int aj, struct STRVEC *sx, int xi, struct STRVEC *sz, int zi) |
| { |
| if(m==0) |
| return; |
| #if defined(DIM_CHECK) |
| // non-negative size |
| if(m<0) printf("\n****** trsv_lnn_libstr : m<0 : %d<0 *****\n", m); |
| // non-negative offset |
| if(ai<0) printf("\n****** trsv_lnn_libstr : ai<0 : %d<0 *****\n", ai); |
| if(aj<0) printf("\n****** trsv_lnn_libstr : aj<0 : %d<0 *****\n", aj); |
| if(xi<0) printf("\n****** trsv_lnn_libstr : xi<0 : %d<0 *****\n", xi); |
| if(zi<0) printf("\n****** trsv_lnn_libstr : zi<0 : %d<0 *****\n", zi); |
| // inside matrix |
| // A: m x k |
| if(ai+m > sA->m) printf("\n***** trsv_lnn_libstr : ai+m > row(A) : %d+%d > %d *****\n", ai, m, sA->m); |
| if(aj+m > sA->n) printf("\n***** trsv_lnn_libstr : aj+m > col(A) : %d+%d > %d *****\n", aj, m, sA->n); |
| // x: m |
| if(xi+m > sx->m) printf("\n***** trsv_lnn_libstr : xi+m > size(x) : %d+%d > %d *****\n", xi, m, sx->m); |
| // z: m |
| if(zi+m > sz->m) printf("\n***** trsv_lnn_libstr : zi+m > size(z) : %d+%d > %d *****\n", zi, m, sz->m); |
| #endif |
| char cl = 'l'; |
| char cn = 'n'; |
| char cr = 'r'; |
| char ct = 't'; |
| char cu = 'u'; |
| int i1 = 1; |
| REAL d1 = 1.0; |
| REAL dm1 = -1.0; |
| int lda = sA->m; |
| REAL *pA = sA->pA + ai + aj*lda; |
| REAL *x = sx->pa + xi; |
| REAL *z = sz->pa + zi; |
| COPY(&m, x, &i1, z, &i1); |
| TRSV(&cl, &cn, &cn, &m, pA, &lda, z, &i1); |
| return; |
| } |
| |
| |
| |
| void TRSV_LNU_LIBSTR(int m, struct STRMAT *sA, int ai, int aj, struct STRVEC *sx, int xi, struct STRVEC *sz, int zi) |
| { |
| if(m==0) |
| return; |
| #if defined(DIM_CHECK) |
| // non-negative size |
| if(m<0) printf("\n****** trsv_lnu_libstr : m<0 : %d<0 *****\n", m); |
| // non-negative offset |
| if(ai<0) printf("\n****** trsv_lnu_libstr : ai<0 : %d<0 *****\n", ai); |
| if(aj<0) printf("\n****** trsv_lnu_libstr : aj<0 : %d<0 *****\n", aj); |
| if(xi<0) printf("\n****** trsv_lnu_libstr : xi<0 : %d<0 *****\n", xi); |
| if(zi<0) printf("\n****** trsv_lnu_libstr : zi<0 : %d<0 *****\n", zi); |
| // inside matrix |
| // A: m x k |
| if(ai+m > sA->m) printf("\n***** trsv_lnu_libstr : ai+m > row(A) : %d+%d > %d *****\n", ai, m, sA->m); |
| if(aj+m > sA->n) printf("\n***** trsv_lnu_libstr : aj+m > col(A) : %d+%d > %d *****\n", aj, m, sA->n); |
| // x: m |
| if(xi+m > sx->m) printf("\n***** trsv_lnu_libstr : xi+m > size(x) : %d+%d > %d *****\n", xi, m, sx->m); |
| // z: m |
| if(zi+m > sz->m) printf("\n***** trsv_lnu_libstr : zi+m > size(z) : %d+%d > %d *****\n", zi, m, sz->m); |
| #endif |
| char cl = 'l'; |
| char cn = 'n'; |
| char cr = 'r'; |
| char ct = 't'; |
| char cu = 'u'; |
| int i1 = 1; |
| REAL d1 = 1.0; |
| REAL dm1 = -1.0; |
| int lda = sA->m; |
| REAL *pA = sA->pA + ai + aj*lda; |
| REAL *x = sx->pa + xi; |
| REAL *z = sz->pa + zi; |
| COPY(&m, x, &i1, z, &i1); |
| TRSV(&cl, &cn, &cu, &m, pA, &lda, z, &i1); |
| return; |
| } |
| |
| |
| |
| void TRSV_LTN_LIBSTR(int m, struct STRMAT *sA, int ai, int aj, struct STRVEC *sx, int xi, struct STRVEC *sz, int zi) |
| { |
| if(m==0) |
| return; |
| #if defined(DIM_CHECK) |
| // non-negative size |
| if(m<0) printf("\n****** trsv_ltn_libstr : m<0 : %d<0 *****\n", m); |
| // non-negative offset |
| if(ai<0) printf("\n****** trsv_ltn_libstr : ai<0 : %d<0 *****\n", ai); |
| if(aj<0) printf("\n****** trsv_ltn_libstr : aj<0 : %d<0 *****\n", aj); |
| if(xi<0) printf("\n****** trsv_ltn_libstr : xi<0 : %d<0 *****\n", xi); |
| if(zi<0) printf("\n****** trsv_ltn_libstr : zi<0 : %d<0 *****\n", zi); |
| // inside matrix |
| // A: m x k |
| if(ai+m > sA->m) printf("\n***** trsv_ltn_libstr : ai+m > row(A) : %d+%d > %d *****\n", ai, m, sA->m); |
| if(aj+m > sA->n) printf("\n***** trsv_ltn_libstr : aj+m > col(A) : %d+%d > %d *****\n", aj, m, sA->n); |
| // x: m |
| if(xi+m > sx->m) printf("\n***** trsv_ltn_libstr : xi+m > size(x) : %d+%d > %d *****\n", xi, m, sx->m); |
| // z: m |
| if(zi+m > sz->m) printf("\n***** trsv_ltn_libstr : zi+m > size(z) : %d+%d > %d *****\n", zi, m, sz->m); |
| #endif |
| char cl = 'l'; |
| char cn = 'n'; |
| char cr = 'r'; |
| char ct = 't'; |
| char cu = 'u'; |
| int i1 = 1; |
| REAL d1 = 1.0; |
| REAL dm1 = -1.0; |
| int lda = sA->m; |
| REAL *pA = sA->pA + ai + aj*lda; |
| REAL *x = sx->pa + xi; |
| REAL *z = sz->pa + zi; |
| COPY(&m, x, &i1, z, &i1); |
| TRSV(&cl, &ct, &cn, &m, pA, &lda, z, &i1); |
| return; |
| } |
| |
| |
| |
| void TRSV_LTU_LIBSTR(int m, struct STRMAT *sA, int ai, int aj, struct STRVEC *sx, int xi, struct STRVEC *sz, int zi) |
| { |
| if(m==0) |
| return; |
| #if defined(DIM_CHECK) |
| // non-negative size |
| if(m<0) printf("\n****** trsv_ltu_libstr : m<0 : %d<0 *****\n", m); |
| // non-negative offset |
| if(ai<0) printf("\n****** trsv_ltu_libstr : ai<0 : %d<0 *****\n", ai); |
| if(aj<0) printf("\n****** trsv_ltu_libstr : aj<0 : %d<0 *****\n", aj); |
| if(xi<0) printf("\n****** trsv_ltu_libstr : xi<0 : %d<0 *****\n", xi); |
| if(zi<0) printf("\n****** trsv_ltu_libstr : zi<0 : %d<0 *****\n", zi); |
| // inside matrix |
| // A: m x k |
| if(ai+m > sA->m) printf("\n***** trsv_ltu_libstr : ai+m > row(A) : %d+%d > %d *****\n", ai, m, sA->m); |
| if(aj+m > sA->n) printf("\n***** trsv_ltu_libstr : aj+m > col(A) : %d+%d > %d *****\n", aj, m, sA->n); |
| // x: m |
| if(xi+m > sx->m) printf("\n***** trsv_ltu_libstr : xi+m > size(x) : %d+%d > %d *****\n", xi, m, sx->m); |
| // z: m |
| if(zi+m > sz->m) printf("\n***** trsv_ltu_libstr : zi+m > size(z) : %d+%d > %d *****\n", zi, m, sz->m); |
| #endif |
| char cl = 'l'; |
| char cn = 'n'; |
| char cr = 'r'; |
| char ct = 't'; |
| char cu = 'u'; |
| int i1 = 1; |
| REAL d1 = 1.0; |
| REAL dm1 = -1.0; |
| int lda = sA->m; |
| REAL *pA = sA->pA + ai + aj*lda; |
| REAL *x = sx->pa + xi; |
| REAL *z = sz->pa + zi; |
| COPY(&m, x, &i1, z, &i1); |
| TRSV(&cl, &ct, &cu, &m, pA, &lda, z, &i1); |
| return; |
| } |
| |
| |
| |
| void TRSV_UNN_LIBSTR(int m, struct STRMAT *sA, int ai, int aj, struct STRVEC *sx, int xi, struct STRVEC *sz, int zi) |
| { |
| if(m==0) |
| return; |
| #if defined(DIM_CHECK) |
| // non-negative size |
| if(m<0) printf("\n****** trsv_unn_libstr : m<0 : %d<0 *****\n", m); |
| // non-negative offset |
| if(ai<0) printf("\n****** trsv_unn_libstr : ai<0 : %d<0 *****\n", ai); |
| if(aj<0) printf("\n****** trsv_unn_libstr : aj<0 : %d<0 *****\n", aj); |
| if(xi<0) printf("\n****** trsv_unn_libstr : xi<0 : %d<0 *****\n", xi); |
| if(zi<0) printf("\n****** trsv_unn_libstr : zi<0 : %d<0 *****\n", zi); |
| // inside matrix |
| // A: m x k |
| if(ai+m > sA->m) printf("\n***** trsv_unn_libstr : ai+m > row(A) : %d+%d > %d *****\n", ai, m, sA->m); |
| if(aj+m > sA->n) printf("\n***** trsv_unn_libstr : aj+m > col(A) : %d+%d > %d *****\n", aj, m, sA->n); |
| // x: m |
| if(xi+m > sx->m) printf("\n***** trsv_unn_libstr : xi+m > size(x) : %d+%d > %d *****\n", xi, m, sx->m); |
| // z: m |
| if(zi+m > sz->m) printf("\n***** trsv_unn_libstr : zi+m > size(z) : %d+%d > %d *****\n", zi, m, sz->m); |
| #endif |
| char cl = 'l'; |
| char cn = 'n'; |
| char cr = 'r'; |
| char ct = 't'; |
| char cu = 'u'; |
| int i1 = 1; |
| REAL d1 = 1.0; |
| REAL dm1 = -1.0; |
| int lda = sA->m; |
| REAL *pA = sA->pA + ai + aj*lda; |
| REAL *x = sx->pa + xi; |
| REAL *z = sz->pa + zi; |
| COPY(&m, x, &i1, z, &i1); |
| TRSV(&cu, &cn, &cn, &m, pA, &lda, z, &i1); |
| return; |
| } |
| |
| |
| |
| void TRSV_UTN_LIBSTR(int m, struct STRMAT *sA, int ai, int aj, struct STRVEC *sx, int xi, struct STRVEC *sz, int zi) |
| { |
| if(m==0) |
| return; |
| #if defined(DIM_CHECK) |
| // non-negative size |
| if(m<0) printf("\n****** trsv_utn_libstr : m<0 : %d<0 *****\n", m); |
| // non-negative offset |
| if(ai<0) printf("\n****** trsv_utn_libstr : ai<0 : %d<0 *****\n", ai); |
| if(aj<0) printf("\n****** trsv_utn_libstr : aj<0 : %d<0 *****\n", aj); |
| if(xi<0) printf("\n****** trsv_utn_libstr : xi<0 : %d<0 *****\n", xi); |
| if(zi<0) printf("\n****** trsv_utn_libstr : zi<0 : %d<0 *****\n", zi); |
| // inside matrix |
| // A: m x k |
| if(ai+m > sA->m) printf("\n***** trsv_utn_libstr : ai+m > row(A) : %d+%d > %d *****\n", ai, m, sA->m); |
| if(aj+m > sA->n) printf("\n***** trsv_utn_libstr : aj+m > col(A) : %d+%d > %d *****\n", aj, m, sA->n); |
| // x: m |
| if(xi+m > sx->m) printf("\n***** trsv_utn_libstr : xi+m > size(x) : %d+%d > %d *****\n", xi, m, sx->m); |
| // z: m |
| if(zi+m > sz->m) printf("\n***** trsv_utn_libstr : zi+m > size(z) : %d+%d > %d *****\n", zi, m, sz->m); |
| #endif |
| char cl = 'l'; |
| char cn = 'n'; |
| char cr = 'r'; |
| char ct = 't'; |
| char cu = 'u'; |
| int i1 = 1; |
| REAL d1 = 1.0; |
| REAL dm1 = -1.0; |
| int lda = sA->m; |
| REAL *pA = sA->pA + ai + aj*lda; |
| REAL *x = sx->pa + xi; |
| REAL *z = sz->pa + zi; |
| COPY(&m, x, &i1, z, &i1); |
| TRSV(&cu, &ct, &cn, &m, pA, &lda, z, &i1); |
| return; |
| } |
| |
| |
| |
| #else |
| |
| #error : wrong LA choice |
| |
| #endif |
| |
| |