📄 dbcovml.c
字号:
/*-------------------------------------------------------|
|  NIST SPARSE BLAS v. 0.9 (Sat Jul 6 14:27:21 EDT 1996) |
|                                                        |
|  Authors:                                              |
|     Karin A. Remington and Roldan Pozo                 |
|     National Institute of Standards and Technology     |
|                                                        |
|  Based on the interface standard proposed in:          |
|   "A Revised Proposal for a Sparse BLAS Toolkit" by    |
|    S. Carney and K. Wu -- University of Minnesota      |
|    M. Heroux and G. Li -- Cray Research                |
|    R. Pozo and K.A. Remington -- NIST                  |
|                                                        |
|  Contact:                                              |
|     Karin A. Remington, email: kremington@nist.gov     |
|-------------------------------------------------------*/

/* Created:  Sat Jul 6 14:32:53 EDT 1996 */

#include "dbcovml.h"

/*
 * Block-coordinate (BCO) matrix-vector kernels, double precision.
 *
 * Conventions shared by every routine in this file, as implemented below:
 *
 *   - Block i occupies the lb*lb consecutive entries val[i*lb*lb ...] and is
 *     traversed column by column (the row index runs fastest).
 *   - bindx[i] / bjndx[i] are the block-row / block-column numbers of block
 *     i, counted from ind_base.  The element offset of a block inside a
 *     vector is (index - ind_base) * lb.
 *   - c is overwritten: it is cleared first and then accumulated into, so
 *     several stored blocks may contribute to the same part of c.
 *   - Negative mb, kb, lb or bnnz make the corresponding loops empty.
 *
 * Parameters common to all routines:
 *   mb, kb     number of block rows / block columns
 *   val        block values, bnnz*lb*lb entries
 *   bindx      block-row index of each stored block (bnnz entries)
 *   bjndx      block-column index of each stored block (bnnz entries)
 *   bnnz       number of stored blocks
 *   lb         order of each square block
 *   b          input vector
 *   c          output vector
 *   ind_base   index base used by bindx and bjndx
 *   alpha      (scaled variants only) scalar applied to the product
 */

/*
 * c = A * b.
 *
 * Clears the first mb*lb entries of c, then adds block * b-segment for each
 * stored block.  Columns whose b entry compares equal to 0.0 are skipped, so
 * the matching column of val is not read for them.
 */
void BCO_VecMult_CAB_double(
                 const int mb, const int kb,
                 const double *val, const int *bindx, const int *bjndx,
                 const int bnnz, const int lb,
                 const double *b, double *c,
                 const int ind_base)
{
  const int m = mb * lb;
  const int mm = lb * lb;
  const double *pval;
  const double *pb;
  double *pc;
  double t;
  int i, ii, jj;

  for (i = 0; i < m; i++) {
    c[i] = 0.0;
  }

  for (i = 0; i < bnnz; i++) {
    pval = &val[i * mm];
    pb = &b[(bjndx[i] - ind_base) * lb];
    pc = &c[(bindx[i] - ind_base) * lb];

    for (jj = 0; jj < lb; jj++) {
      t = pb[jj];
      if (t != 0.0) {
        for (ii = 0; ii < lb; ii++) {
          pc[ii] += t * (*pval++);
        }
      } else {
        pval += lb;   /* step over the unused column */
      }
    }
  }
}

/*
 * c = A' * b  (A' is the transpose of A).
 *
 * Clears the first kb*lb entries of c.  For each stored block the roles of
 * bindx and bjndx are swapped: b is read at the block-row offset and c is
 * updated at the block-column offset, each output entry being the dot
 * product of one stored column with the b segment.
 */
void BCO_VecMult_CATB_double(
                 const int mb, const int kb,
                 const double *val, const int *bindx, const int *bjndx,
                 const int bnnz, const int lb,
                 const double *b, double *c,
                 const int ind_base)
{
  const int k = kb * lb;
  const int mm = lb * lb;
  const double *pval;
  const double *pb;
  double *pc;
  double t;
  int i, ii, jj;

  for (i = 0; i < k; i++) {
    c[i] = 0.0;
  }

  for (i = 0; i < bnnz; i++) {
    pval = &val[i * mm];
    pb = &b[(bindx[i] - ind_base) * lb];
    pc = &c[(bjndx[i] - ind_base) * lb];

    for (jj = 0; jj < lb; jj++) {
      t = 0;
      for (ii = 0; ii < lb; ii++) {
        t += pb[ii] * (*pval++);
      }
      pc[jj] += t;
    }
  }
}

/*
 * c = A * b for a symmetric A of which each off-diagonal block is stored
 * once.
 *
 * Clears the first mb*lb entries of c.  Every stored block is applied as in
 * BCO_VecMult_CAB_double; a block whose row and column offsets differ is
 * then applied a second time, transposed, at the mirrored position.
 */
void BCOsymm_VecMult_CAB_double(
                 const int mb, const int kb,
                 const double *val, const int *bindx, const int *bjndx,
                 const int bnnz, const int lb,
                 const double *b, double *c,
                 const int ind_base)
{
  const int m = mb * lb;
  const int mm = lb * lb;
  const double *blk;
  const double *pval;
  const double *pb;
  double *pc;
  double t;
  int row_off, col_off;
  int i, ii, jj;

  for (i = 0; i < m; i++) {
    c[i] = 0.0;
  }

  for (i = 0; i < bnnz; i++) {
    row_off = (bindx[i] - ind_base) * lb;
    col_off = (bjndx[i] - ind_base) * lb;
    blk = &val[i * mm];

    /* stored block: c[row] += blk * b[col] */
    pval = blk;
    pb = &b[col_off];
    pc = &c[row_off];
    for (jj = 0; jj < lb; jj++) {
      t = pb[jj];
      if (t != 0.0) {
        for (ii = 0; ii < lb; ii++) {
          pc[ii] += t * (*pval++);
        }
      } else {
        pval += lb;
      }
    }

    if (row_off == col_off) {
      continue;   /* diagonal block: no mirrored counterpart */
    }

    /* mirrored block: c[col] += blk' * b[row] */
    pval = blk;
    pb = &b[row_off];
    pc = &c[col_off];
    for (jj = 0; jj < lb; jj++) {
      t = 0;
      for (ii = 0; ii < lb; ii++) {
        t += pb[ii] * (*pval++);
      }
      pc[jj] += t;
    }
  }
}

/*
 * c = A * b for a skew-symmetric A of which each off-diagonal block is
 * stored once.
 *
 * Clears the first mb*lb entries of c.  Blocks whose row and column offsets
 * coincide are ignored entirely.  Every other block is applied as stored and
 * its transpose is subtracted at the mirrored position.
 */
void BCOskew_VecMult_CAB_double(
                 const int mb, const int kb,
                 const double *val, const int *bindx, const int *bjndx,
                 const int bnnz, const int lb,
                 const double *b, double *c,
                 const int ind_base)
{
  const int m = mb * lb;
  const int mm = lb * lb;
  const double *blk;
  const double *pval;
  const double *pb;
  double *pc;
  double t;
  int row_off, col_off;
  int i, ii, jj;

  for (i = 0; i < m; i++) {
    c[i] = 0.0;
  }

  for (i = 0; i < bnnz; i++) {
    row_off = (bindx[i] - ind_base) * lb;
    col_off = (bjndx[i] - ind_base) * lb;
    if (row_off == col_off) {
      continue;
    }
    blk = &val[i * mm];

    /* stored block: c[row] += blk * b[col] */
    pval = blk;
    pb = &b[col_off];
    pc = &c[row_off];
    for (jj = 0; jj < lb; jj++) {
      t = pb[jj];
      if (t != 0.0) {
        for (ii = 0; ii < lb; ii++) {
          pc[ii] += t * (*pval++);
        }
      } else {
        pval += lb;
      }
    }

    /* mirrored block: c[col] -= blk' * b[row] */
    pval = blk;
    pb = &b[row_off];
    pc = &c[col_off];
    for (jj = 0; jj < lb; jj++) {
      t = 0;
      for (ii = 0; ii < lb; ii++) {
        t -= pb[ii] * (*pval++);
      }
      pc[jj] += t;
    }
  }
}

/*
 * c = A' * b for a skew-symmetric A of which each off-diagonal block is
 * stored once.
 *
 * Clears the first kb*lb entries of c.  Same traversal as
 * BCOskew_VecMult_CAB_double with both signs flipped: the stored block is
 * subtracted and its transpose is added at the mirrored position.
 */
void BCOskew_VecMult_CATB_double(
                 const int mb, const int kb,
                 const double *val, const int *bindx, const int *bjndx,
                 const int bnnz, const int lb,
                 const double *b, double *c,
                 const int ind_base)
{
  const int k = kb * lb;
  const int mm = lb * lb;
  const double *blk;
  const double *pval;
  const double *pb;
  double *pc;
  double t;
  int row_off, col_off;
  int i, ii, jj;

  for (i = 0; i < k; i++) {
    c[i] = 0.0;
  }

  for (i = 0; i < bnnz; i++) {
    row_off = (bindx[i] - ind_base) * lb;
    col_off = (bjndx[i] - ind_base) * lb;
    if (row_off == col_off) {
      continue;
    }
    blk = &val[i * mm];

    /* stored block: c[row] -= blk * b[col] */
    pval = blk;
    pb = &b[col_off];
    pc = &c[row_off];
    for (jj = 0; jj < lb; jj++) {
      t = pb[jj];
      if (t != 0.0) {
        for (ii = 0; ii < lb; ii++) {
          pc[ii] -= t * (*pval++);
        }
      } else {
        pval += lb;
      }
    }

    /* mirrored block: c[col] += blk' * b[row] */
    pval = blk;
    pb = &b[row_off];
    pc = &c[col_off];
    for (jj = 0; jj < lb; jj++) {
      t = 0;
      for (ii = 0; ii < lb; ii++) {
        t += pb[ii] * (*pval++);
      }
      pc[jj] += t;
    }
  }
}

/*
 * c = alpha * A * b.
 *
 * Same traversal as BCO_VecMult_CAB_double; each b entry is multiplied by
 * alpha once before it is applied to a block column.
 */
void BCO_VecMult_CaAB_double(
                 const int mb, const int kb, const double alpha,
                 const double *val, const int *bindx, const int *bjndx,
                 const int bnnz, const int lb,
                 const double *b, double *c,
                 const int ind_base)
{
  const int m = mb * lb;
  const int mm = lb * lb;
  const double *pval;
  const double *pb;
  double *pc;
  double t;
  int i, ii, jj;

  for (i = 0; i < m; i++) {
    c[i] = 0.0;
  }

  for (i = 0; i < bnnz; i++) {
    pval = &val[i * mm];
    pb = &b[(bjndx[i] - ind_base) * lb];
    pc = &c[(bindx[i] - ind_base) * lb];

    for (jj = 0; jj < lb; jj++) {
      if (pb[jj] != 0.0) {
        t = alpha * pb[jj];
        for (ii = 0; ii < lb; ii++) {
          pc[ii] += t * (*pval++);
        }
      } else {
        pval += lb;
      }
    }
  }
}

/*
 * c = alpha * A' * b.
 *
 * Same traversal as BCO_VecMult_CATB_double; alpha multiplies every term of
 * each dot product.
 */
void BCO_VecMult_CaATB_double(
                 const int mb, const int kb, const double alpha,
                 const double *val, const int *bindx, const int *bjndx,
                 const int bnnz, const int lb,
                 const double *b, double *c,
                 const int ind_base)
{
  const int k = kb * lb;
  const int mm = lb * lb;
  const double *pval;
  const double *pb;
  double *pc;
  double t;
  int i, ii, jj;

  for (i = 0; i < k; i++) {
    c[i] = 0.0;
  }

  for (i = 0; i < bnnz; i++) {
    pval = &val[i * mm];
    pb = &b[(bindx[i] - ind_base) * lb];
    pc = &c[(bjndx[i] - ind_base) * lb];

    for (jj = 0; jj < lb; jj++) {
      t = 0;
      for (ii = 0; ii < lb; ii++) {
        t += alpha * pb[ii] * (*pval++);
      }
      pc[jj] += t;
    }
  }
}

/*
 * c = alpha * A * b for a symmetric A of which each off-diagonal block is
 * stored once.
 *
 * Same traversal as BCOsymm_VecMult_CAB_double with alpha applied to both
 * the stored and the mirrored contribution.
 */
void BCOsymm_VecMult_CaAB_double(
                 const int mb, const int kb, const double alpha,
                 const double *val, const int *bindx, const int *bjndx,
                 const int bnnz, const int lb,
                 const double *b, double *c,
                 const int ind_base)
{
  const int m = mb * lb;
  const int mm = lb * lb;
  const double *blk;
  const double *pval;
  const double *pb;
  double *pc;
  double t;
  int row_off, col_off;
  int i, ii, jj;

  for (i = 0; i < m; i++) {
    c[i] = 0.0;
  }

  for (i = 0; i < bnnz; i++) {
    row_off = (bindx[i] - ind_base) * lb;
    col_off = (bjndx[i] - ind_base) * lb;
    blk = &val[i * mm];

    /* stored block: c[row] += alpha * blk * b[col] */
    pval = blk;
    pb = &b[col_off];
    pc = &c[row_off];
    for (jj = 0; jj < lb; jj++) {
      if (pb[jj] != 0.0) {
        t = alpha * pb[jj];
        for (ii = 0; ii < lb; ii++) {
          pc[ii] += t * (*pval++);
        }
      } else {
        pval += lb;
      }
    }

    if (row_off == col_off) {
      continue;   /* diagonal block: no mirrored counterpart */
    }

    /* mirrored block: c[col] += alpha * blk' * b[row] */
    pval = blk;
    pb = &b[row_off];
    pc = &c[col_off];
    for (jj = 0; jj < lb; jj++) {
      t = 0;
      for (ii = 0; ii < lb; ii++) {
        t += alpha * pb[ii] * (*pval++);
      }
      pc[jj] += t;
    }
  }
}

/*
 * c = alpha * A * b for a skew-symmetric A of which each off-diagonal block
 * is stored once.
 *
 * Same traversal as BCOskew_VecMult_CAB_double with alpha applied to both
 * the stored and the mirrored contribution.
 */
void BCOskew_VecMult_CaAB_double(
                 const int mb, const int kb, const double alpha,
                 const double *val, const int *bindx, const int *bjndx,
                 const int bnnz, const int lb,
                 const double *b, double *c,
                 const int ind_base)
{
  const int m = mb * lb;
  const int mm = lb * lb;
  const double *blk;
  const double *pval;
  const double *pb;
  double *pc;
  double t;
  int row_off, col_off;
  int i, ii, jj;

  for (i = 0; i < m; i++) {
    c[i] = 0.0;
  }

  for (i = 0; i < bnnz; i++) {
    row_off = (bindx[i] - ind_base) * lb;
    col_off = (bjndx[i] - ind_base) * lb;
    if (row_off == col_off) {
      continue;
    }
    blk = &val[i * mm];

    /* stored block: c[row] += alpha * blk * b[col] */
    pval = blk;
    pb = &b[col_off];
    pc = &c[row_off];
    for (jj = 0; jj < lb; jj++) {
      if (pb[jj] != 0.0) {
        t = alpha * pb[jj];
        for (ii = 0; ii < lb; ii++) {
          pc[ii] += t * (*pval++);
        }
      } else {
        pval += lb;
      }
    }

    /* mirrored block: c[col] -= alpha * blk' * b[row] */
    pval = blk;
    pb = &b[row_off];
    pc = &c[col_off];
    for (jj = 0; jj < lb; jj++) {
      t = 0;
      for (ii = 0; ii < lb; ii++) {
        t -= alpha * pb[ii] * (*pval++);
      }
      pc[jj] += t;
    }
  }
}

/*
 * NOTE(review): the definition below is incomplete in the available source
 * text -- it stops in the middle of its first block loop.  It is reproduced
 * token for token so nothing is lost; unlike the routines above it still
 * subtracts a hard-coded 1 from bindx/bjndx instead of ind_base.  Restore the
 * missing tail from the original distribution before building this file.
 */
void BCOskew_VecMult_CaATB_double(
                 const int mb, const int kb, const double alpha,
                 const double *val, const int *bindx, const int *bjndx,
                 const int bnnz, const int lb,
                 const double *b, double *c,
                 const int ind_base)
{
  double t;
  const double *pb;
  double *pc=c;
  const double *pval;
  int i,j,jb,je,block;
  int cs,css,cr,bs,br;
  int index;
  int ii,jj;
  int m=mb*lb;
  int k=kb*lb;
  int mm=lb*lb;
  const double *ptmp;

  for (i=0;i!=k;i++) *pc++ = 0;

  for (i=0;i!=bnnz;i++) {
    cs = (bindx[i]-1)*lb;
    bs = (bjndx[i]-1)*lb;
    if ( cs == bs ) {
      continue;
    }
    pval = &val[i*mm];
    ptmp = pval;
    pb = &b[bs];
    pc = &c[cs];
    for (jj=0;jj!=lb;jj++) {
      if( pb[jj] != 0.0 ) {
        t = alpha * pb[jj];
        for (ii=0;ii!=lb;ii++) {
          pc[ii] -= t* (*pval++);
        }
      } else {
        pval+=lb;
⌨️ 快捷键说明
复制代码
Ctrl + C
搜索代码
Ctrl + F
全屏模式
F11
切换主题
Ctrl + Shift + D
显示快捷键
?
增大字号
Ctrl + =
减小字号
Ctrl + -