atl_trputu.c

来自「基于Blas CLapck的.用过的人知道是干啥的」· C语言 代码 · 共 134 行

C
134
字号
/* *             Automatically Tuned Linear Algebra Software v3.8.0 *                    (C) Copyright 1997 R. Clint Whaley * * Redistribution and use in source and binary forms, with or without * modification, are permitted provided that the following conditions * are met: *   1. Redistributions of source code must retain the above copyright *      notice, this list of conditions and the following disclaimer. *   2. Redistributions in binary form must reproduce the above copyright *      notice, this list of conditions, and the following disclaimer in the *      documentation and/or other materials provided with the distribution. *   3. The name of the ATLAS group or the names of its contributers may *      not be used to endorse or promote products derived from this *      software without specific written permission. * * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE ATLAS GROUP OR ITS CONTRIBUTORS * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE * POSSIBILITY OF SUCH DAMAGE. * */#include "atlas_kern3.h"#ifdef TREALvoid Mjoin(Mjoin(PATL,trputU),BNM)   (const int N, const TYPE *v, const SCALAR beta0, TYPE *A, const int lda)/* * Writes the upper part of an NxN workspace v to the upper part of the array A */{   register int i, j;   const register SCALAR beta=beta0;   for (j=0; j != N; j++)   {      for (i=0; i <= j; i++)         #if defined(BETA1)            A[i] += v[i];         #elif defined(BETA0)            A[i] = v[i];         #else            A[i] = beta*A[i] + v[i];         #endif      v += N;      A += lda;   }}#else#ifdef Herm_   void Mjoin(Mjoin(PATL,heputU),BNM)#else   void Mjoin(Mjoin(PATL,trputU),BNM)#endif   (const int N, const TYPE *v, const SCALAR beta0, TYPE *A, const int lda)/* * Writes the upper part of an NxN workspace v to the upper part of the array A */{   int i, j2;   const int N2=N<<1, lda2=lda<<1;   #ifdef Herm_      const TYPE zero=0.0;   #endif   #ifdef BETAXI0      const register TYPE rbeta=*beta0;   #elif defined(BETAX)      register TYPE ra, ia;      const register TYPE rbeta=*beta0, ibeta=beta0[1];   #endif   for (j2=0; j2 != N2; j2 += 2)   {      #ifdef BETA1         for (i=0; i != j2; i++) A[i] += v[i];         A[j2] += v[j2];         #ifdef Herm_            A[j2+1] = zero;         #else            A[j2+1] += v[j2+1];         #endif      #elif defined(BETA0)         for (i=0; i != j2; i++) A[i] = v[i];         A[j2] = v[j2];         #ifdef Herm_            A[j2+1] = zero;         #else            A[j2+1] = v[j2+1];         #endif      #elif defined(BETAN1) || defined(BETAXI0)         for (i=0; i != j2; i++) A[i] = ATL_MulByBETA(A[i]) + v[i];         A[j2] = ATL_MulByBETA(A[j2]) + v[j2];         #ifdef Herm_            A[j2+1] = zero;         #else            A[j2+1] = ATL_MulByBETA(A[j2+1]) + v[j2+1];         #endif      #else/* *       Last iteration unrolled to get around compiler error on IA64 */         for (i=0; i != j2; i += 2)         {            ra = A[i];            ia = A[i+1];            A[i] = ra*rbeta - ia*ibeta + v[i];            A[i+1] = ra*ibeta + ia*rbeta + v[i+1];         }         #ifdef Herm_            #error "Hermitian matrix must have real BETA"         #else            ra = A[j2];            ia = A[j2+1];            A[j2] = ra*rbeta - ia*ibeta + v[j2];            A[j2+1] = ra*ibeta + ia*rbeta + v[j2+1];         #endif      #endif      v += N2;      A += lda2;   }}#endif

⌨️ 快捷键说明

复制代码Ctrl + C
搜索代码Ctrl + F
全屏模式F11
增大字号Ctrl + =
减小字号Ctrl + -
显示快捷键?