https://hal.archives-ouvertes.fr/hal-02128878
Raw File
Tip revision: 4201397494d9af8b687117e8ff4d85a8944f5c5a authored by Software Heritage on 11 June 2019, 10:15:02 UTC
hal: Deposit 298 in collection hal
Tip revision: 4201397
fflas_faxpy.inl
/* fflas/fflas_faxpy.inl
 * Copyright (C) 2005 Clement Pernet
 *
 * Written by Clement Pernet <Clement.Pernet@imag.fr>
 *
 *
 * ========LICENCE========
 * This file is part of the library FFLAS-FFPACK.
 *
 * FFLAS-FFPACK is free software: you can redistribute it and/or modify
 * it under the terms of the  GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * This library is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with this library; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA  02110-1301  USA
 * ========LICENCE========
 *
 */

#ifndef __FFLASFFPACK_faxpy_INL
#define __FFLASFFPACK_faxpy_INL



namespace FFLAS {

    /**
     * @brief Strided vector update over a generic field: every selected
     *        element y of Y is updated with F.axpyin(y, a, x), where x is
     *        the matching element of X.
     *
     * The elements touched are X[0], X[incX], ..., X[(N-1)*incX] and
     * Y[0], Y[incY], ..., Y[(N-1)*incY].
     *
     * @param F    field providing isZero, isOne, isMOne and axpyin
     * @param N    number of elements to update
     * @param a    scalar multiplier
     * @param X    read-only input vector
     * @param incX stride between consecutive elements of X
     * @param Y    vector updated in place
     * @param incY stride between consecutive elements of Y
     */
    template<class Field>
    inline void
    faxpy( const Field& F, const size_t N,
           const typename Field::Element a,
           typename Field::ConstElement_ptr X, const size_t incX,
           typename Field::Element_ptr Y, const size_t incY )
    {
        // a == 0: nothing to add, Y is left untouched.
        if (F.isZero(a))
            return ;

        // a == 1 and a == -1 are handed to the dedicated in-place
        // routines faddin / fsubin instead of going through axpyin.
        if (F.isOne(a))
            return faddin(F,N,X,incX,Y,incY);

        if (F.isMOne(a))
            return fsubin(F,N,X,incX,Y,incY);

        // Count elements rather than stepping a pointer up to X+N*incX.
        // For a strided view whose last element sits at the tail of its
        // buffer, X+N*incX lies beyond one-past-the-end, and merely
        // forming that pointer is undefined behaviour. Counting also
        // means incX == 0 reuses X[0] for all N elements instead of
        // silently skipping the loop.
        for (size_t i = 0; i < N; ++i)
            F.axpyin( *(Y + i*incY), a, *(X + i*incX) );
    }

    /**
     * @brief Strided vector faxpy specialized for Givaro::DoubleDomain.
     *
     * The whole update is forwarded to the BLAS routine cblas_daxpy; the
     * field argument itself is not used. N, incx and incy are narrowed
     * from size_t to int before the call.
     *
     * When __FFLASFFPACK_OPENBLAS_NUM_THREADS is defined and
     * __FFLASFFPACK_OPENBLAS_NT_ALREADY_SET is not, the OpenBLAS thread
     * count is set to that value before the BLAS call.
     */
    template<>
    inline void
    faxpy( const Givaro::DoubleDomain& , const size_t N,
           const Givaro::DoubleDomain::Element a,
           Givaro::DoubleDomain::ConstElement_ptr x, const size_t incx,
           Givaro::DoubleDomain::Element_ptr y, const size_t incy )
    {
#if defined(__FFLASFFPACK_OPENBLAS_NUM_THREADS) && !defined(__FFLASFFPACK_OPENBLAS_NT_ALREADY_SET)
        openblas_set_num_threads(__FFLASFFPACK_OPENBLAS_NUM_THREADS);
#endif
        cblas_daxpy( static_cast<int>(N), a,
                     x, static_cast<int>(incx),
                     y, static_cast<int>(incy) );
    }

    /**
     * @brief Strided vector faxpy specialized for Givaro::FloatDomain.
     *
     * The whole update is forwarded to the BLAS routine cblas_saxpy; the
     * field argument itself is not used. N, incx and incy are narrowed
     * from size_t to int before the call.
     *
     * When __FFLASFFPACK_OPENBLAS_NUM_THREADS is defined and
     * __FFLASFFPACK_OPENBLAS_NT_ALREADY_SET is not, the OpenBLAS thread
     * count is set to that value before the BLAS call.
     */
    template<>
    inline void
    faxpy( const Givaro::FloatDomain& , const size_t N,
           const Givaro::FloatDomain::Element a,
           Givaro::FloatDomain::ConstElement_ptr x, const size_t incx,
           Givaro::FloatDomain::Element_ptr y, const size_t incy )
    {
#if defined(__FFLASFFPACK_OPENBLAS_NUM_THREADS) && !defined(__FFLASFFPACK_OPENBLAS_NT_ALREADY_SET)
        openblas_set_num_threads(__FFLASFFPACK_OPENBLAS_NUM_THREADS);
#endif
        cblas_saxpy( static_cast<int>(N), a,
                     x, static_cast<int>(incx),
                     y, static_cast<int>(incy) );
    }

    /**
     * @brief Matrix version of faxpy over a generic field: applies the
     *        strided vector faxpy with scalar a to every row of X and Y.
     *
     * Row i of X starts at X + i*ldX and row i of Y at Y + i*ldY; within
     * a row the n elements are visited with stride 1.
     *
     * @param F   field providing isZero, isOne and isMOne
     * @param m   number of rows
     * @param n   number of elements per row
     * @param a   scalar multiplier
     * @param X   read-only input matrix
     * @param ldX distance between the starts of consecutive rows of X
     * @param Y   matrix updated in place
     * @param ldY distance between the starts of consecutive rows of Y
     */
    template<class Field>
    inline void
    faxpy( const Field& F, const size_t m, const size_t n,
           const typename Field::Element a,
           typename Field::ConstElement_ptr X, const size_t ldX,
           typename Field::Element_ptr Y, const size_t ldY )
    {
        // a == 0: nothing to add, Y is left untouched.
        if (F.isZero(a))
            return ;

        // a == 1 and a == -1 are handed to the dedicated in-place
        // matrix routines faddin / fsubin.
        if (F.isOne(a))
            return faddin(F,m,n,X,ldX,Y,ldY);

        if (F.isMOne(a))
            return fsubin(F,m,n,X,ldX,Y,ldY);

        // Both operands have no gap between rows: treat them as a single
        // vector of m*n elements.
        if (n == ldX && n == ldY)
            return faxpy(F,m*n,a,X,1,Y,1);

        // Walk the rows by count rather than comparing against X+m*ldX.
        // For a submatrix view (ldX > n) that reaches the last row of its
        // parent, X+m*ldX lies beyond one-past-the-end of the buffer, and
        // forming that pointer is undefined behaviour.
        for (size_t i = 0; i < m; ++i) {
            typename Field::ConstElement_ptr Xi = X + i*ldX;
            typename Field::Element_ptr Yi = Y + i*ldY;
            faxpy(F,n,a,Xi,1,Yi,1);
        }
    }

} // FFLAS

#endif // __FFLASFFPACK_faxpy_INL
/* -*- mode: C++; tab-width: 4; indent-tabs-mode: nil; c-basic-offset: 4 -*- */
// vim:sts=4:sw=4:ts=4:et:sr:cino=>s,f0,{0,g0,(0,\:0,t0,+0,=s
back to top