// https://hal.archives-ouvertes.fr/hal-02128878
// Raw File
// Tip revision: 4201397494d9af8b687117e8ff4d85a8944f5c5a authored by Software Heritage on 11 June 2019, 10:15:02 UTC
// hal: Deposit 298 in collection hal
// Tip revision: 4201397
// fflas_fscal_mp.inl
/*
 * Copyright (C) 2014 FFLAS-FFPACK group
 *
 * Written by Pascal Giorgi <pascal.giorgi@lirmm.fr>
 *
 *
 * ========LICENCE========
 * This file is part of the library FFLAS-FFPACK.
 *
 * FFLAS-FFPACK is free software: you can redistribute it and/or modify
 * it under the terms of the  GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * This library is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with this library; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA  02110-1301  USA
 * ========LICENCE========
 *.
 */

#ifndef __FFLASFFPACK_fscal_mp_INL
#define __FFLASFFPACK_fscal_mp_INL

#include "fflas-ffpack/field/rns-integer.h"
#include "fflas_fscal.h"
#include "fflas_fgemm.inl"
namespace FFLAS {

    /*
     *  specialization for the field RNSInteger<rns_double>
     */

    // Level 1 fscalin for RNSInteger<rns_double>.
    // The call is forwarded, one residue at a time, to the fscalin of each
    // field stored in F.rns()._field_rns. For residue k the scalar is
    // alpha._ptr[k*alpha._stride] and the vector starts at A._ptr + k*A._stride;
    // n and inc are handed through unchanged.
    template<>
    inline void fscalin(const FFPACK::RNSInteger<FFPACK::rns_double> &F,  const size_t n,
                        const FFPACK::rns_double::Element alpha,
                        FFPACK::rns_double::Element_ptr A, const size_t inc)
    {
        for (size_t k = 0; k < F.size(); ++k) {
            fscalin(F.rns()._field_rns[k], n,
                    alpha._ptr[k * alpha._stride],
                    A._ptr + k * A._stride, inc);
        }
    }
    // Level 1 fscal for RNSInteger<rns_double>.
    // The call is forwarded, one residue at a time, to the fscal of each field
    // stored in F.rns()._field_rns. For residue k the scalar is
    // alpha._ptr[k*alpha._stride], the input starts at A._ptr + k*A._stride and
    // the output at B._ptr + k*B._stride; n, Ainc and Binc are handed through
    // unchanged.
    template<>
    inline void fscal(const FFPACK::RNSInteger<FFPACK::rns_double> &F,  const size_t n,
                      const FFPACK::rns_double::Element alpha,
                      FFPACK::rns_double::ConstElement_ptr A, const size_t Ainc,
                      FFPACK::rns_double::Element_ptr B, const size_t Binc)
    {
        for (size_t k = 0; k < F.size(); ++k) {
            fscal(F.rns()._field_rns[k], n,
                  alpha._ptr[k * alpha._stride],
                  A._ptr + k * A._stride, Ainc,
                  B._ptr + k * B._stride, Binc);
        }
    }
    // Level 2 fscalin for RNSInteger<rns_double>.
    // The call is forwarded, one residue at a time, to the level 2 fscalin of
    // each field stored in F.rns()._field_rns. For residue k the scalar is
    // alpha._ptr[k*alpha._stride] and the matrix starts at A._ptr + k*A._stride;
    // m, n and lda are handed through unchanged.
    template<>
    inline void fscalin(const FFPACK::RNSInteger<FFPACK::rns_double> &F,  const size_t m, const size_t n,
                        const FFPACK::rns_double::Element alpha,
                        FFPACK::rns_double::Element_ptr A, const size_t lda) {
        for (size_t k = 0; k < F.size(); ++k) {
            fscalin(F.rns()._field_rns[k], m, n,
                    alpha._ptr[k * alpha._stride],
                    A._ptr + k * A._stride, lda);
        }
    }
    // Level 2 fscal for RNSInteger<rns_double>.
    // The call is forwarded, one residue at a time, to the level 2 fscal of
    // each field stored in F.rns()._field_rns. For residue k the scalar is
    // alpha._ptr[k*alpha._stride], the input starts at A._ptr + k*A._stride and
    // the output at B._ptr + k*B._stride; m, n, lda and ldb are handed through
    // unchanged.
    template<>
    inline void fscal(const FFPACK::RNSInteger<FFPACK::rns_double> &F, const size_t m, const size_t n,
                      const FFPACK::rns_double::Element alpha,
                      FFPACK::rns_double::ConstElement_ptr A, const size_t lda,
                      FFPACK::rns_double::Element_ptr B, const size_t ldb) {
        for (size_t k = 0; k < F.size(); ++k) {
            fscal(F.rns()._field_rns[k], m, n,
                  alpha._ptr[k * alpha._stride],
                  A._ptr + k * A._stride, lda,
                  B._ptr + k * B._stride, ldb);
        }
    }
}

#include "fflas-ffpack/fflas/fflas_freduce_mp.inl"

namespace FFLAS {
    /*
     *  specialization for the field RNSIntegerMod<rns_double>
     */

    // Level 1 fscalin for RNSIntegerMod<rns_double>.
    // Two steps: first fscalin is run over the field returned by F.delayed(),
    // then freduce is called with F on the same n entries of A (stride inc).
    template<>
    inline void fscalin(const FFPACK::RNSIntegerMod<FFPACK::rns_double> &F,  const size_t n,
                        const typename FFPACK::RNSIntegerMod<FFPACK::rns_double>::Element alpha,
                        typename FFPACK::RNSIntegerMod<FFPACK::rns_double>::Element_ptr A, const size_t inc)
    {
        const auto &delayedField = F.delayed();

        fscalin(delayedField, n, alpha, A, inc);
        freduce(F, n, A, inc);
    }
    // Level 1 fscal for RNSIntegerMod<rns_double>.
    // Two steps: first fscal is run over the field returned by F.delayed(),
    // reading from A and writing to B, then freduce is called with F on the n
    // entries of the output B (stride Binc).
    template<>
    inline void fscal(const FFPACK::RNSIntegerMod<FFPACK::rns_double> &F,  const size_t n,
                      const FFPACK::rns_double::Element alpha,
                      FFPACK::rns_double::ConstElement_ptr A, const size_t Ainc,
                      FFPACK::rns_double::Element_ptr B, const size_t Binc)
    {
        const auto &delayedField = F.delayed();

        fscal(delayedField, n, alpha, A, Ainc, B, Binc);
        freduce(F, n, B, Binc);
    }
    // Level 2 fscalin for RNSIntegerMod<rns_double>.
    // Two steps: first the level 2 fscalin is run over the field returned by
    // F.delayed(), then freduce is called with F on the same m x n matrix A
    // (leading dimension lda).
    template<>
    inline void fscalin(const FFPACK::RNSIntegerMod<FFPACK::rns_double> &F,  const size_t m, const size_t n,
                        const FFPACK::rns_double::Element alpha,
                        FFPACK::rns_double::Element_ptr A, const size_t lda)
    {
        const auto &delayedField = F.delayed();

        fscalin(delayedField, m, n, alpha, A, lda);
        freduce(F, m, n, A, lda);
    }
    // Level 2 fscal for RNSIntegerMod<rns_double>.
    // Two steps: first the level 2 fscal is run over the field returned by
    // F.delayed(), reading from A and writing to B, then freduce is called with
    // F on the m x n output matrix B (leading dimension ldb).
    template<>
    inline void fscal(const FFPACK::RNSIntegerMod<FFPACK::rns_double> &F, const size_t m, const size_t n,
                      const FFPACK::rns_double::Element alpha,
                      FFPACK::rns_double::ConstElement_ptr A, const size_t lda,
                      FFPACK::rns_double::Element_ptr B, const size_t ldb)
    {
        const auto &delayedField = F.delayed();

        fscal(delayedField, m, n, alpha, A, lda, B, ldb);
        freduce(F, m, n, B, ldb);
    }

} //end of namespace FFLAS


#endif

/* -*- mode: C++; tab-width: 4; indent-tabs-mode: nil; c-basic-offset: 4 -*- */
// vim:sts=4:sw=4:ts=4:et:sr:cino=>s,f0,{0,g0,(0,\:0,t0,+0,=s
// back to top