// Source: https://github.com/Microsoft/CNTK (raw file)
// Tip revision: 13862788278f0a22aef6e1b21cea2b36e916a767, authored by Vadim Mazalov on 10 January 2020, 01:27:22 UTC
// Tip revision message: "Enable cuda evaluation of RNNT models"
// File: MatrixQuantizerCPU.h
#pragma once

#include "MatrixQuantizerImpl.h"
#include "ColumnQuantizer.h"
#include "QuantizedMatrix.h"
#include "CPUMatrix.h"

// MATH_API: symbol-visibility decoration.
// On Windows it expands to __declspec(dllexport) when MATH_EXPORTS is defined
// and to __declspec(dllimport) otherwise; on every other platform it expands
// to nothing.
// NOTE(review): MATH_EXPORTS is presumably defined only while building the
// math library itself -- confirm against the build configuration.
#ifdef _WIN32
#ifdef MATH_EXPORTS
#define MATH_API __declspec(dllexport)
#else
#define MATH_API __declspec(dllimport)
#endif
#else // no DLLs on Linux
#define MATH_API
#endif

namespace Microsoft { namespace MSR { namespace CNTK {

//see dbn::matrix quantizer
// Concrete, final implementation of the MatrixQuantizerImpl<ElemType> interface.
// Judging by the class name and the CPUMatrix.h include, this is the CPU-side
// quantizer; the member definitions are not part of this header.
// Instances cannot be copied (copy constructor and copy assignment are deleted).
template <class ElemType>
class MatrixQuantizerCPU final : public MatrixQuantizerImpl<ElemType>
{
public:
    // Default constructor; takes no arguments (defined out of line).
    MatrixQuantizerCPU();

    // Disallow copy construction and assignment
    MatrixQuantizerCPU(const MatrixQuantizerCPU&) = delete;
    MatrixQuantizerCPU& operator=(const MatrixQuantizerCPU&) = delete;

    // Starts quantization. inMatrix and inResidual are read-only inputs;
    // outQMatrix and outResidual are passed by non-const reference and serve as outputs.
    // NOTE(review): presumably inMatrix combined with inResidual is quantized into
    // outQMatrix and the new quantization error is written to outResidual -- confirm
    // against the implementation.
    // NOTE(review): zeroThresholdFor1Bit presumably selects a zero threshold for the
    // 1-bit quantization case -- exact meaning is defined in the implementation.
    void QuantizeAsync(const Matrix<ElemType>& inMatrix, const Matrix<ElemType>& inResidual, QuantizedMatrix<ElemType>& outQMatrix, Matrix<ElemType>& outResidual, bool zeroThresholdFor1Bit) override;
    // Counterpart of QuantizeAsync; by its name, blocks until that operation has finished.
    void WaitQuantizeAsyncDone() override;

    // Starts the reverse operation: reads inQMatrix and writes to outMatrix.
    // 'add' defaults to false.
    // NOTE(review): presumably add == true accumulates into outMatrix instead of
    // overwriting it -- confirm against the implementation.
    // NOTE(review): default arguments of virtual functions are chosen by the static
    // type of the call expression, so this default should stay in sync with the
    // base-class declaration.
    void UnquantizeAsync(QuantizedMatrix<ElemType>& inQMatrix, Matrix<ElemType>& outMatrix, bool add = false) override;
    // Counterpart of UnquantizeAsync; by its name, blocks until that operation has finished.
    void WaitUnquantizeAsyncDone() override;
};
} } }
// (end of file)