///////////////////////////////////////////////////////////////////////////////////
// Copyright (C) 2015 Edouard Griffiths, F4EXB                                   //
//                                                                               //
// This program is free software; you can redistribute it and/or modify          //
// it under the terms of the GNU General Public License as published by          //
// the Free Software Foundation as version 3 of the License, or                  //
// (at your option) any later version.                                           //
//                                                                               //
// This program is distributed in the hope that it will be useful,               //
// but WITHOUT ANY WARRANTY; without even the implied warranty of                //
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the                  //
// GNU General Public License V3 for more details.                               //
//                                                                               //
// You should have received a copy of the GNU General Public License             //
// along with this program. If not, see <http://www.gnu.org/licenses/>.          //
///////////////////////////////////////////////////////////////////////////////////
#ifndef INCLUDE_DSP_SAMPLESINKFIFODECIMATOR_H_
#define INCLUDE_DSP_SAMPLESINKFIFODECIMATOR_H_
#include <stdint.h>
#include <QtGlobal>
#include "dsp/dsptypes.h"
#include "dsp/inthalfbandfilter.h"
#include "samplesinkfifodoublebuffered.h"
/**
 * Table of bit shifts applied before ("pre") and after ("post") each
 * decimation factor (1, 2, 4, 8, 16, 32, 64), selected by two integer
 * template arguments.
 *
 * This primary template is the fallback used for any argument pair that has
 * no explicit specialization: every shift is zero.
 *
 * NOTE(review): the parameter names are reconstructed. Judging from the
 * <16, 16>, <16, 12> and <16, 8> specializations the first argument is
 * presumably the internal sample width and the second the input sample width,
 * both in bits - confirm.
 */
template<uint32_t SdrBits, uint32_t InputBits>
struct decimation_shifts
{
    static const uint32_t pre1   = 0;
    static const uint32_t pre2   = 0;
    static const uint32_t post2  = 0;
    static const uint32_t pre4   = 0;
    static const uint32_t post4  = 0;
    static const uint32_t pre8   = 0;
    static const uint32_t post8  = 0;
    static const uint32_t pre16  = 0;
    static const uint32_t post16 = 0;
    static const uint32_t pre32  = 0;
    static const uint32_t post32 = 0;
    static const uint32_t pre64  = 0;
    static const uint32_t post64 = 0;
};
/**
 * Shift table for the <16, 16> argument pair.
 *
 * No pre-shift is applied at any decimation factor; the post-shift grows by
 * one bit per doubling of the decimation factor (1 bit at 2x up to 6 bits at 64x).
 */
template<>
struct decimation_shifts<16, 16>
{
    // Left shifts applied to the input before filtering: none.
    static const uint32_t pre1   = 0;
    static const uint32_t pre2   = 0;
    static const uint32_t pre4   = 0;
    static const uint32_t pre8   = 0;
    static const uint32_t pre16  = 0;
    static const uint32_t pre32  = 0;
    static const uint32_t pre64  = 0;

    // Right shifts applied to the result: log2 of the decimation factor.
    static const uint32_t post2  = 1;
    static const uint32_t post4  = 2;
    static const uint32_t post8  = 3;
    static const uint32_t post16 = 4;
    static const uint32_t post32 = 5;
    static const uint32_t post64 = 6;
};
/**
 * Shift table for the <16, 12> argument pair.
 *
 * The pre-shift starts at 4 bits for factor 1 and shrinks by one bit per
 * doubling of the decimation factor until it reaches zero at 16x; from 32x on
 * the result is shifted right instead (1 bit at 32x, 2 bits at 64x).
 */
template<>
struct decimation_shifts<16, 12>
{
    // Left shifts applied to the input before filtering.
    static const uint32_t pre1   = 4;
    static const uint32_t pre2   = 3;
    static const uint32_t pre4   = 2;
    static const uint32_t pre8   = 1;
    static const uint32_t pre16  = 0;
    static const uint32_t pre32  = 0;
    static const uint32_t pre64  = 0;

    // Right shifts applied to the result.
    static const uint32_t post2  = 0;
    static const uint32_t post4  = 0;
    static const uint32_t post8  = 0;
    static const uint32_t post16 = 0;
    static const uint32_t post32 = 1;
    static const uint32_t post64 = 2;
};
/**
 * Shift table for the <16, 8> argument pair.
 *
 * The pre-shift starts at 6 bits for factor 1 and shrinks by one bit per
 * doubling of the decimation factor, reaching zero at 64x. No post-shift is
 * applied at any factor.
 */
template<>
struct decimation_shifts<16, 8>
{
    // Left shifts applied to the input before filtering.
    static const uint32_t pre1   = 6;
    static const uint32_t pre2   = 5;
    static const uint32_t pre4   = 4;
    static const uint32_t pre8   = 3;
    static const uint32_t pre16  = 2;
    static const uint32_t pre32  = 1;
    static const uint32_t pre64  = 0;

    // Right shifts applied to the result: none.
    static const uint32_t post2  = 0;
    static const uint32_t post4  = 0;
    static const uint32_t post8  = 0;
    static const uint32_t post16 = 0;
    static const uint32_t post32 = 0;
    static const uint32_t post64 = 0;
};
/**
 * Decimating writer for a SampleSinkFifoDoubleBuffered.
 *
 * Every decimateN_* method reads `len` elements of type T from `buf`
 * (alternating real / imaginary values), reduces them by the factor N and
 * writes the resulting samples through the FIFO's write iterator.
 *
 * Method suffixes:
 *  - _inf / _sup : variants using the "Inf (LSB)" / "Sup (USB)" rotation
 *                  patterns described in decimate4_sup.
 *  - _cen        : variant using only the half-band filter cascade
 *                  (presumably "centered" - confirm).
 *  - _u          : decimate-by-2 variant that subtracts 255 from the summed
 *                  imaginary terms.
 *
 * Scaling is taken from decimation_shifts<SdrBits, InputBits>.
 *
 * NOTE(review): the template parameter list is reconstructed; T is the input
 * element type, the two integers select the shift table.
 */
template<typename T, uint32_t SdrBits, uint32_t InputBits>
class SampleSinkFifoDecimator
{
public:
	void decimate1(SampleSinkFifoDoubleBuffered& fifo, const T* buf, qint32 len);
	void decimate2_u(SampleSinkFifoDoubleBuffered& fifo, const T* buf, qint32 len);
	void decimate2_inf(SampleSinkFifoDoubleBuffered& fifo, const T* buf, qint32 len);
	void decimate2_sup(SampleSinkFifoDoubleBuffered& fifo, const T* buf, qint32 len);
	void decimate2_cen(SampleSinkFifoDoubleBuffered& fifo, const T* buf, qint32 len);
	void decimate4_inf(SampleSinkFifoDoubleBuffered& fifo, const T* buf, qint32 len);
	void decimate4_sup(SampleSinkFifoDoubleBuffered& fifo, const T* buf, qint32 len);
	void decimate4_cen(SampleSinkFifoDoubleBuffered& fifo, const T* buf, qint32 len);
	void decimate8_inf(SampleSinkFifoDoubleBuffered& fifo, const T* buf, qint32 len);
	void decimate8_sup(SampleSinkFifoDoubleBuffered& fifo, const T* buf, qint32 len);
	void decimate8_cen(SampleSinkFifoDoubleBuffered& fifo, const T* buf, qint32 len);
	void decimate16_inf(SampleSinkFifoDoubleBuffered& fifo, const T* buf, qint32 len);
	void decimate16_sup(SampleSinkFifoDoubleBuffered& fifo, const T* buf, qint32 len);
	void decimate16_cen(SampleSinkFifoDoubleBuffered& fifo, const T* buf, qint32 len);
	void decimate32_inf(SampleSinkFifoDoubleBuffered& fifo, const T* buf, qint32 len);
	void decimate32_sup(SampleSinkFifoDoubleBuffered& fifo, const T* buf, qint32 len);
	void decimate32_cen(SampleSinkFifoDoubleBuffered& fifo, const T* buf, qint32 len);
	void decimate64_inf(SampleSinkFifoDoubleBuffered& fifo, const T* buf, qint32 len);
	void decimate64_sup(SampleSinkFifoDoubleBuffered& fifo, const T* buf, qint32 len);
	void decimate64_cen(SampleSinkFifoDoubleBuffered& fifo, const T* buf, qint32 len);

private:
	// One half-band filter instance per cascade stage; each keeps its own
	// state, so a stage must always be fed through the same member.
	IntHalfbandFilter m_decimator2;  // 1st stages
	IntHalfbandFilter m_decimator4;  // 2nd stages
	IntHalfbandFilter m_decimator8;  // 3rd stages
	IntHalfbandFilter m_decimator16; // 4th stages
	IntHalfbandFilter m_decimator32; // 5th stages
	IntHalfbandFilter m_decimator64; // 6th stages
};
template
void SampleSinkFifoDecimator::decimate1(SampleSinkFifoDoubleBuffered& fifo, const T* buf, qint32 len)
{
	qint32 xreal, yimag;
	SampleVector::iterator it;
	fifo.getWriteIterator(it);
	for (int pos = 0; pos < len - 1; pos += 2)
	{
		xreal = buf[pos+0];
		yimag = buf[pos+1];
		(*it).setReal(xreal << decimation_shifts::pre1); // Valgrind optim (2 - comment not repeated)
		(*it).setImag(yimag << decimation_shifts::pre1);
		fifo.bumpIndex(it);
	}
}
template
void SampleSinkFifoDecimator::decimate2_u(SampleSinkFifoDoubleBuffered& fifo, const T* buf, qint32 len)
{
	qint32 xreal, yimag;
	SampleVector::iterator it;
	fifo.getWriteIterator(it);
	for (int pos = 0; pos < len - 7; pos += 8)
	{
		xreal = (buf[pos+0] - buf[pos+3]) << decimation_shifts::pre2;
		yimag = (buf[pos+1] + buf[pos+2] - 255) << decimation_shifts::pre2;
		(*it).setReal(xreal >> decimation_shifts::post2);
		(*it).setImag(yimag >> decimation_shifts::post2);
		fifo.bumpIndex(it);
		xreal = (buf[pos+7] - buf[pos+4]) << decimation_shifts::pre2;
		yimag = (255 - buf[pos+5] - buf[pos+6]) << decimation_shifts::pre2;
		(*it).setReal(xreal >> decimation_shifts::post2);
		(*it).setImag(yimag >> decimation_shifts::post2);
		fifo.bumpIndex(it);
	}
}
template
void SampleSinkFifoDecimator::decimate2_inf(SampleSinkFifoDoubleBuffered& fifo, const T* buf, qint32 len)
{
	qint32 xreal, yimag;
	SampleVector::iterator it;
	fifo.getWriteIterator(it);
	for (int pos = 0; pos < len - 7; pos += 8)
	{
		xreal = (buf[pos+0] - buf[pos+3]) << decimation_shifts::pre2;
		yimag = (buf[pos+1] + buf[pos+2]) << decimation_shifts::pre2;
		(*it).setReal(xreal >> decimation_shifts::post2);
		(*it).setImag(yimag >> decimation_shifts::post2);
		fifo.bumpIndex(it);
		xreal = (buf[pos+7] - buf[pos+4]) << decimation_shifts::pre2;
		yimag = (- buf[pos+5] - buf[pos+6]) << decimation_shifts::pre2;
		(*it).setReal(xreal >> decimation_shifts::post2);
		(*it).setImag(yimag >> decimation_shifts::post2);
		fifo.bumpIndex(it);
	}
}
template
void SampleSinkFifoDecimator::decimate2_sup(SampleSinkFifoDoubleBuffered& fifo, const T* buf, qint32 len)
{
	qint32 xreal, yimag;
	SampleVector::iterator it;
	fifo.getWriteIterator(it);
	for (int pos = 0; pos < len - 7; pos += 8)
	{
		xreal = (buf[pos+1] - buf[pos+2]) << decimation_shifts::pre2;
		yimag = (- buf[pos+0] - buf[pos+3]) << decimation_shifts::pre2;
		(*it).setReal(xreal >> decimation_shifts::post2);
		(*it).setImag(yimag >> decimation_shifts::post2);
		fifo.bumpIndex(it);
		xreal = (buf[pos+6] - buf[pos+5]) << decimation_shifts::pre2;
		yimag = (buf[pos+4] + buf[pos+7]) << decimation_shifts::pre2;
		(*it).setReal(xreal >> decimation_shifts::post2);
		(*it).setImag(yimag >> decimation_shifts::post2);
		fifo.bumpIndex(it);
	}
}
template
void SampleSinkFifoDecimator::decimate4_inf(SampleSinkFifoDoubleBuffered& fifo, const T* buf, qint32 len)
{
	qint32 xreal, yimag;
	SampleVector::iterator it;
	fifo.getWriteIterator(it);
	for (int pos = 0; pos < len - 7; pos += 8)
	{
		xreal = (buf[pos+0] - buf[pos+3] + buf[pos+7] - buf[pos+4]) << decimation_shifts::pre4;
		yimag = (buf[pos+1] - buf[pos+5] + buf[pos+2] - buf[pos+6]) << decimation_shifts::pre4;
		(*it).setReal(xreal >> decimation_shifts::post4);
		(*it).setImag(yimag >> decimation_shifts::post4);
		fifo.bumpIndex(it);
	}
}
template
void SampleSinkFifoDecimator::decimate4_sup(SampleSinkFifoDoubleBuffered& fifo, const T* buf, qint32 len)
{
	// Sup (USB):
	//            x  y   x  y   x   y  x   y  / x -> 1,-2,-5,6 / y -> -0,-3,4,7
	// [ rotate:  1, 0, -2, 3, -5, -4, 6, -7]
	// Inf (LSB):
	//            x  y   x  y   x   y  x   y  / x -> 0,-3,-4,7 / y -> 1,2,-5,-6
	// [ rotate:  0, 1, -3, 2, -4, -5, 7, -6]
	qint32 xreal, yimag;
	SampleVector::iterator it;
	fifo.getWriteIterator(it);
	for (int pos = 0; pos < len - 7; pos += 8)
	{
		xreal = (buf[pos+1] - buf[pos+2] - buf[pos+5] + buf[pos+6]) << decimation_shifts::pre4;
		yimag = (- buf[pos+0] - buf[pos+3] + buf[pos+4] + buf[pos+7]) << decimation_shifts::pre4;
		(*it).setReal(xreal >> decimation_shifts::post4);
		(*it).setImag(yimag >> decimation_shifts::post4);
		fifo.bumpIndex(it);
	}
}
template
void SampleSinkFifoDecimator::decimate8_inf(SampleSinkFifoDoubleBuffered& fifo, const T* buf, qint32 len)
{
	qint32 xreal[2], yimag[2];
	SampleVector::iterator it;
	fifo.getWriteIterator(it);
	for (int pos = 0; pos < len - 15; pos += 8)
	{
		xreal[0] = (buf[pos+0] - buf[pos+3] + buf[pos+7] - buf[pos+4]) << decimation_shifts::pre8;
		yimag[0] = (buf[pos+1] - buf[pos+5] + buf[pos+2] - buf[pos+6]) << decimation_shifts::pre8;
		pos += 8;
		xreal[1] = (buf[pos+0] - buf[pos+3] + buf[pos+7] - buf[pos+4]) << decimation_shifts::pre8;
		yimag[1] = (buf[pos+1] - buf[pos+5] + buf[pos+2] - buf[pos+6]) << decimation_shifts::pre8;
		m_decimator2.myDecimate(xreal[0], yimag[0], &xreal[1], &yimag[1]);
		(*it).setReal(xreal[1] >> decimation_shifts::post8);
		(*it).setImag(yimag[1] >> decimation_shifts::post8);
		fifo.bumpIndex(it);
	}
}
template
void SampleSinkFifoDecimator::decimate8_sup(SampleSinkFifoDoubleBuffered& fifo, const T* buf, qint32 len)
{
	qint32 xreal[2], yimag[2];
	SampleVector::iterator it;
	fifo.getWriteIterator(it);
	for (int pos = 0; pos < len - 15; pos += 8)
	{
		xreal[0] = (buf[pos+1] - buf[pos+2] - buf[pos+5] + buf[pos+6]) << decimation_shifts::pre8;
		yimag[0] = (- buf[pos+0] - buf[pos+3] + buf[pos+4] + buf[pos+7]) << decimation_shifts::pre8;
		pos += 8;
		xreal[1] = (buf[pos+1] - buf[pos+2] - buf[pos+5] + buf[pos+6]) << decimation_shifts::pre8;
		yimag[1] = (- buf[pos+0] - buf[pos+3] + buf[pos+4] + buf[pos+7]) << decimation_shifts::pre8;
		m_decimator2.myDecimate(xreal[0], yimag[0], &xreal[1], &yimag[1]);
		(*it).setReal(xreal[1] >> decimation_shifts::post8);
		(*it).setImag(yimag[1] >> decimation_shifts::post8);
		fifo.bumpIndex(it);
	}
}
template
void SampleSinkFifoDecimator::decimate16_inf(SampleSinkFifoDoubleBuffered& fifo, const T* buf, qint32 len)
{
	// Offset tuning: 4x downsample and rotate, then
	// downsample 4x more. [ rotate:  0, 1, -3, 2, -4, -5, 7, -6]
	qint32 xreal[4], yimag[4];
	SampleVector::iterator it;
	fifo.getWriteIterator(it);
	for (int pos = 0; pos < len - 31; )
	{
		for (int i = 0; i < 4; i++)
		{
			xreal[i] = (buf[pos+0] - buf[pos+3] + buf[pos+7] - buf[pos+4]) << decimation_shifts::pre16;
			yimag[i] = (buf[pos+1] - buf[pos+5] + buf[pos+2] - buf[pos+6]) << decimation_shifts::pre16;
			pos += 8;
		}
		m_decimator2.myDecimate(xreal[0], yimag[0], &xreal[1], &yimag[1]);
		m_decimator2.myDecimate(xreal[2], yimag[2], &xreal[3], &yimag[3]);
		m_decimator4.myDecimate(xreal[1], yimag[1], &xreal[3], &yimag[3]);
		(*it).setReal(xreal[3] >> decimation_shifts::post16);
		(*it).setImag(yimag[3] >> decimation_shifts::post16);
		fifo.bumpIndex(it);
	}
}
template
void SampleSinkFifoDecimator::decimate16_sup(SampleSinkFifoDoubleBuffered& fifo, const T* buf, qint32 len)
{
	// Offset tuning: 4x downsample and rotate, then
	// downsample 4x more. [ rotate:  1, 0, -2, 3, -5, -4, 6, -7]
	qint32 xreal[4], yimag[4];
	SampleVector::iterator it;
	fifo.getWriteIterator(it);
	for (int pos = 0; pos < len - 31; )
	{
		for (int i = 0; i < 4; i++)
		{
			xreal[i] = (buf[pos+1] - buf[pos+2] - buf[pos+5] + buf[pos+6]) << decimation_shifts::pre16;
			yimag[i] = (buf[pos+4] + buf[pos+7] - buf[pos+0] - buf[pos+3]) << decimation_shifts::pre16;
			pos += 8;
		}
		m_decimator2.myDecimate(xreal[0], yimag[0], &xreal[1], &yimag[1]);
		m_decimator2.myDecimate(xreal[2], yimag[2], &xreal[3], &yimag[3]);
		m_decimator4.myDecimate(xreal[1], yimag[1], &xreal[3], &yimag[3]);
		(*it).setReal(xreal[3] >> decimation_shifts::post16);
		(*it).setImag(yimag[3] >> decimation_shifts::post16);
		fifo.bumpIndex(it);
	}
}
template
void SampleSinkFifoDecimator::decimate32_inf(SampleSinkFifoDoubleBuffered& fifo, const T* buf, qint32 len)
{
	qint32 xreal[8], yimag[8];
	SampleVector::iterator it;
	fifo.getWriteIterator(it);
	for (int pos = 0; pos < len - 63; )
	{
		for (int i = 0; i < 8; i++)
		{
			xreal[i] = (buf[pos+0] - buf[pos+3] + buf[pos+7] - buf[pos+4]) << decimation_shifts::pre32;
			yimag[i] = (buf[pos+1] - buf[pos+5] + buf[pos+2] - buf[pos+6]) << decimation_shifts::pre32;
			pos += 8;
		}
		m_decimator2.myDecimate(xreal[0], yimag[0], &xreal[1], &yimag[1]);
		m_decimator2.myDecimate(xreal[2], yimag[2], &xreal[3], &yimag[3]);
		m_decimator2.myDecimate(xreal[4], yimag[4], &xreal[5], &yimag[5]);
		m_decimator2.myDecimate(xreal[6], yimag[6], &xreal[7], &yimag[7]);
		m_decimator4.myDecimate(xreal[1], yimag[1], &xreal[3], &yimag[3]);
		m_decimator4.myDecimate(xreal[5], yimag[5], &xreal[7], &yimag[7]);
		m_decimator8.myDecimate(xreal[3], yimag[3], &xreal[7], &yimag[7]);
		(*it).setReal(xreal[7] >> decimation_shifts::post32);
		(*it).setImag(yimag[7] >> decimation_shifts::post32);
		fifo.bumpIndex(it);
	}
}
template
void SampleSinkFifoDecimator::decimate32_sup(SampleSinkFifoDoubleBuffered& fifo, const T* buf, qint32 len)
{
	qint32 xreal[8], yimag[8];
	SampleVector::iterator it;
	fifo.getWriteIterator(it);
	for (int pos = 0; pos < len - 63; )
	{
		for (int i = 0; i < 8; i++)
		{
			xreal[i] = (buf[pos+1] - buf[pos+2] - buf[pos+5] + buf[pos+6]) << decimation_shifts::pre32;
			yimag[i] = (buf[pos+4] + buf[pos+7] - buf[pos+0] - buf[pos+3]) << decimation_shifts::pre32;
			pos += 8;
		}
		m_decimator2.myDecimate(xreal[0], yimag[0], &xreal[1], &yimag[1]);
		m_decimator2.myDecimate(xreal[2], yimag[2], &xreal[3], &yimag[3]);
		m_decimator2.myDecimate(xreal[4], yimag[4], &xreal[5], &yimag[5]);
		m_decimator2.myDecimate(xreal[6], yimag[6], &xreal[7], &yimag[7]);
		m_decimator4.myDecimate(xreal[1], yimag[1], &xreal[3], &yimag[3]);
		m_decimator4.myDecimate(xreal[5], yimag[5], &xreal[7], &yimag[7]);
		m_decimator8.myDecimate(xreal[3], yimag[3], &xreal[7], &yimag[7]);
		(*it).setReal(xreal[7] >> decimation_shifts::post32);
		(*it).setImag(yimag[7] >> decimation_shifts::post32);
		fifo.bumpIndex(it);
	}
}
template
void SampleSinkFifoDecimator::decimate64_inf(SampleSinkFifoDoubleBuffered& fifo, const T* buf, qint32 len)
{
	qint32 xreal[16], yimag[16];
	SampleVector::iterator it;
	fifo.getWriteIterator(it);
	for (int pos = 0; pos < len - 127; )
	{
		for (int i = 0; i < 16; i++)
		{
			xreal[i] = (buf[pos+0] - buf[pos+3] + buf[pos+7] - buf[pos+4]) << decimation_shifts::pre64;
			yimag[i] = (buf[pos+1] - buf[pos+5] + buf[pos+2] - buf[pos+6]) << decimation_shifts::pre64;
			pos += 8;
		}
		m_decimator2.myDecimate(xreal[0], yimag[0], &xreal[1], &yimag[1]);
		m_decimator2.myDecimate(xreal[2], yimag[2], &xreal[3], &yimag[3]);
		m_decimator2.myDecimate(xreal[4], yimag[4], &xreal[5], &yimag[5]);
		m_decimator2.myDecimate(xreal[6], yimag[6], &xreal[7], &yimag[7]);
		m_decimator2.myDecimate(xreal[8], yimag[8], &xreal[9], &yimag[9]);
		m_decimator2.myDecimate(xreal[10], yimag[10], &xreal[11], &yimag[11]);
		m_decimator2.myDecimate(xreal[12], yimag[12], &xreal[13], &yimag[13]);
		m_decimator2.myDecimate(xreal[14], yimag[14], &xreal[15], &yimag[15]);
		m_decimator4.myDecimate(xreal[1], yimag[1], &xreal[3], &yimag[3]);
		m_decimator4.myDecimate(xreal[5], yimag[5], &xreal[7], &yimag[7]);
		m_decimator4.myDecimate(xreal[9], yimag[9], &xreal[11], &yimag[11]);
		m_decimator4.myDecimate(xreal[13], yimag[13], &xreal[15], &yimag[15]);
		m_decimator8.myDecimate(xreal[3], yimag[3], &xreal[7], &yimag[7]);
		m_decimator8.myDecimate(xreal[11], yimag[11], &xreal[15], &yimag[15]);
		m_decimator16.myDecimate(xreal[7], yimag[7], &xreal[15], &yimag[15]);
		(*it).setReal(xreal[15] >> decimation_shifts::post64);
		(*it).setImag(yimag[15] >> decimation_shifts::post64);
		fifo.bumpIndex(it);
	}
}
template
void SampleSinkFifoDecimator::decimate64_sup(SampleSinkFifoDoubleBuffered& fifo, const T* buf, qint32 len)
{
	qint32 xreal[16], yimag[16];
	SampleVector::iterator it;
	fifo.getWriteIterator(it);
	for (int pos = 0; pos < len - 127; )
	{
		for (int i = 0; i < 16; i++)
		{
			xreal[i] = (buf[pos+1] - buf[pos+2] - buf[pos+5] + buf[pos+6]) << decimation_shifts::pre32;
			yimag[i] = (buf[pos+4] + buf[pos+7] - buf[pos+0] - buf[pos+3]) << decimation_shifts::pre32;
			pos += 8;
		}
		m_decimator2.myDecimate(xreal[0], yimag[0], &xreal[1], &yimag[1]);
		m_decimator2.myDecimate(xreal[2], yimag[2], &xreal[3], &yimag[3]);
		m_decimator2.myDecimate(xreal[4], yimag[4], &xreal[5], &yimag[5]);
		m_decimator2.myDecimate(xreal[6], yimag[6], &xreal[7], &yimag[7]);
		m_decimator2.myDecimate(xreal[8], yimag[8], &xreal[9], &yimag[9]);
		m_decimator2.myDecimate(xreal[10], yimag[10], &xreal[11], &yimag[11]);
		m_decimator2.myDecimate(xreal[12], yimag[12], &xreal[13], &yimag[13]);
		m_decimator2.myDecimate(xreal[14], yimag[14], &xreal[15], &yimag[15]);
		m_decimator4.myDecimate(xreal[1], yimag[1], &xreal[3], &yimag[3]);
		m_decimator4.myDecimate(xreal[5], yimag[5], &xreal[7], &yimag[7]);
		m_decimator4.myDecimate(xreal[9], yimag[9], &xreal[11], &yimag[11]);
		m_decimator4.myDecimate(xreal[13], yimag[13], &xreal[15], &yimag[15]);
		m_decimator8.myDecimate(xreal[3], yimag[3], &xreal[7], &yimag[7]);
		m_decimator8.myDecimate(xreal[11], yimag[11], &xreal[15], &yimag[15]);
		m_decimator16.myDecimate(xreal[7], yimag[7], &xreal[15], &yimag[15]);
		(*it).setReal(xreal[15] >> decimation_shifts::post64);
		(*it).setImag(yimag[15] >> decimation_shifts::post64);
		fifo.bumpIndex(it);
	}
}
template
void SampleSinkFifoDecimator::decimate2_cen(SampleSinkFifoDoubleBuffered& fifo, const T* buf, qint32 len)
{
	qint32 intbuf[2];
	SampleVector::iterator it;
	fifo.getWriteIterator(it);
	for (int pos = 0; pos < len - 3; pos += 4)
	{
		intbuf[0]  = buf[pos+2] << decimation_shifts::pre2;
		intbuf[1]  = buf[pos+3] << decimation_shifts::pre2;
		m_decimator2.myDecimate(
				buf[pos+0] << decimation_shifts::pre2,
				buf[pos+1] << decimation_shifts::pre2,
				&intbuf[0],
				&intbuf[1]);
		(*it).setReal(intbuf[0] >> decimation_shifts::post2);
		(*it).setImag(intbuf[1] >> decimation_shifts::post2);
		fifo.bumpIndex(it);
	}
}
template
void SampleSinkFifoDecimator::decimate4_cen(SampleSinkFifoDoubleBuffered& fifo, const T* buf, qint32 len)
{
	qint32 intbuf[4];
	SampleVector::iterator it;
	fifo.getWriteIterator(it);
	for (int pos = 0; pos < len - 7; pos += 8)
	{
		intbuf[0]  = buf[pos+2] << decimation_shifts::pre4;
		intbuf[1]  = buf[pos+3] << decimation_shifts::pre4;
		intbuf[2]  = buf[pos+6] << decimation_shifts::pre4;
		intbuf[3]  = buf[pos+7] << decimation_shifts::pre4;
		m_decimator2.myDecimate(
				buf[pos+0] << decimation_shifts::pre4,
				buf[pos+1] << decimation_shifts::pre4,
				&intbuf[0],
				&intbuf[1]);
		m_decimator2.myDecimate(
				buf[pos+4] << decimation_shifts::pre4,
				buf[pos+5] << decimation_shifts::pre4,
				&intbuf[2],
				&intbuf[3]);
		m_decimator4.myDecimate(
				intbuf[0],
				intbuf[1],
				&intbuf[2],
				&intbuf[3]);
		(*it).setReal(intbuf[2] >> decimation_shifts::post4);
		(*it).setImag(intbuf[3] >> decimation_shifts::post4);
		fifo.bumpIndex(it);
	}
}
template
void SampleSinkFifoDecimator::decimate8_cen(SampleSinkFifoDoubleBuffered& fifo, const T* buf, qint32 len)
{
	qint32 intbuf[8];
	SampleVector::iterator it;
	fifo.getWriteIterator(it);
	for (int pos = 0; pos < len - 15; pos += 16)
	{
		intbuf[0]  = buf[pos+2] << decimation_shifts::pre8;
		intbuf[1]  = buf[pos+3] << decimation_shifts::pre8;
		intbuf[2]  = buf[pos+6] << decimation_shifts::pre8;
		intbuf[3]  = buf[pos+7] << decimation_shifts::pre8;
		intbuf[4]  = buf[pos+10] << decimation_shifts::pre8;
		intbuf[5]  = buf[pos+11] << decimation_shifts::pre8;
		intbuf[6]  = buf[pos+14] << decimation_shifts::pre8;
		intbuf[7]  = buf[pos+15] << decimation_shifts::pre8;
		m_decimator2.myDecimate(
				buf[pos+0] << decimation_shifts::pre8,
				buf[pos+1] << decimation_shifts::pre8,
				&intbuf[0],
				&intbuf[1]);
		m_decimator2.myDecimate(
				buf[pos+4] << decimation_shifts::pre8,
				buf[pos+5] << decimation_shifts::pre8,
				&intbuf[2],
				&intbuf[3]);
		m_decimator2.myDecimate(
				buf[pos+8] << decimation_shifts::pre8,
				buf[pos+9] << decimation_shifts::pre8,
				&intbuf[4],
				&intbuf[5]);
		m_decimator2.myDecimate(
				buf[pos+12] << decimation_shifts::pre8,
				buf[pos+13] << decimation_shifts::pre8,
				&intbuf[6],
				&intbuf[7]);
		m_decimator4.myDecimate(
				intbuf[0],
				intbuf[1],
				&intbuf[2],
				&intbuf[3]);
		m_decimator4.myDecimate(
				intbuf[4],
				intbuf[5],
				&intbuf[6],
				&intbuf[7]);
		m_decimator8.myDecimate(
				intbuf[2],
				intbuf[3],
				&intbuf[6],
				&intbuf[7]);
		(*it).setReal(intbuf[6] >> decimation_shifts::post8);
		(*it).setImag(intbuf[7] >> decimation_shifts::post8);
		fifo.bumpIndex(it);
	}
}
template
void SampleSinkFifoDecimator::decimate16_cen(SampleSinkFifoDoubleBuffered& fifo, const T* buf, qint32 len)
{
	qint32 intbuf[16];
	SampleVector::iterator it;
	fifo.getWriteIterator(it);
	for (int pos = 0; pos < len - 31; pos += 32)
	{
		intbuf[0]  = buf[pos+2] << decimation_shifts::pre16;
		intbuf[1]  = buf[pos+3] << decimation_shifts::pre16;
		intbuf[2]  = buf[pos+6] << decimation_shifts::pre16;
		intbuf[3]  = buf[pos+7] << decimation_shifts::pre16;
		intbuf[4]  = buf[pos+10] << decimation_shifts::pre16;
		intbuf[5]  = buf[pos+11] << decimation_shifts::pre16;
		intbuf[6]  = buf[pos+14] << decimation_shifts::pre16;
		intbuf[7]  = buf[pos+15] << decimation_shifts::pre16;
		intbuf[8]  = buf[pos+18] << decimation_shifts::pre16;
		intbuf[9]  = buf[pos+19] << decimation_shifts::pre16;
		intbuf[10] = buf[pos+22] << decimation_shifts::pre16;
		intbuf[11] = buf[pos+23] << decimation_shifts::pre16;
		intbuf[12] = buf[pos+26] << decimation_shifts::pre16;
		intbuf[13] = buf[pos+27] << decimation_shifts::pre16;
		intbuf[14] = buf[pos+30] << decimation_shifts::pre16;
		intbuf[15] = buf[pos+31] << decimation_shifts::pre16;
		m_decimator2.myDecimate(
				buf[pos+0] << decimation_shifts::pre16,
				buf[pos+1] << decimation_shifts::pre16,
				&intbuf[0],
				&intbuf[1]);
		m_decimator2.myDecimate(
				buf[pos+4] << decimation_shifts::pre16,
				buf[pos+5] << decimation_shifts::pre16,
				&intbuf[2],
				&intbuf[3]);
		m_decimator2.myDecimate(
				buf[pos+8] << decimation_shifts::pre16,
				buf[pos+9] << decimation_shifts::pre16,
				&intbuf[4],
				&intbuf[5]);
		m_decimator2.myDecimate(
				buf[pos+12] << decimation_shifts::pre16,
				buf[pos+13] << decimation_shifts::pre16,
				&intbuf[6],
				&intbuf[7]);
		m_decimator2.myDecimate(
				buf[pos+16] << decimation_shifts::pre16,
				buf[pos+17] << decimation_shifts::pre16,
				&intbuf[8],
				&intbuf[9]);
		m_decimator2.myDecimate(
				buf[pos+20] << decimation_shifts::pre16,
				buf[pos+21] << decimation_shifts::pre16,
				&intbuf[10],
				&intbuf[11]);
		m_decimator2.myDecimate(
				buf[pos+24] << decimation_shifts::pre16,
				buf[pos+25] << decimation_shifts::pre16,
				&intbuf[12],
				&intbuf[13]);
		m_decimator2.myDecimate(
				buf[pos+28] << decimation_shifts::pre16,
				buf[pos+29] << decimation_shifts::pre16,
				&intbuf[14],
				&intbuf[15]);
		m_decimator4.myDecimate(
				intbuf[0],
				intbuf[1],
				&intbuf[2],
				&intbuf[3]);
		m_decimator4.myDecimate(
				intbuf[4],
				intbuf[5],
				&intbuf[6],
				&intbuf[7]);
		m_decimator4.myDecimate(
				intbuf[8],
				intbuf[9],
				&intbuf[10],
				&intbuf[11]);
		m_decimator4.myDecimate(
				intbuf[12],
				intbuf[13],
				&intbuf[14],
				&intbuf[15]);
		m_decimator8.myDecimate(
				intbuf[2],
				intbuf[3],
				&intbuf[6],
				&intbuf[7]);
		m_decimator8.myDecimate(
				intbuf[10],
				intbuf[11],
				&intbuf[14],
				&intbuf[15]);
		m_decimator16.myDecimate(
				intbuf[6],
				intbuf[7],
				&intbuf[14],
				&intbuf[15]);
		(*it).setReal(intbuf[14] >> decimation_shifts::post16);
		(*it).setImag(intbuf[15] >> decimation_shifts::post16);
		fifo.bumpIndex(it);
	}
}
template
void SampleSinkFifoDecimator::decimate32_cen(SampleSinkFifoDoubleBuffered& fifo, const T* buf, qint32 len)
{
	qint32 intbuf[32];
	SampleVector::iterator it;
	fifo.getWriteIterator(it);
	for (int pos = 0; pos < len - 63; pos += 64)
	{
		intbuf[0]  = buf[pos+2] << decimation_shifts::pre32;
		intbuf[1]  = buf[pos+3] << decimation_shifts::pre32;
		intbuf[2]  = buf[pos+6] << decimation_shifts::pre32;
		intbuf[3]  = buf[pos+7] << decimation_shifts::pre32;
		intbuf[4]  = buf[pos+10] << decimation_shifts::pre32;
		intbuf[5]  = buf[pos+11] << decimation_shifts::pre32;
		intbuf[6]  = buf[pos+14] << decimation_shifts::pre32;
		intbuf[7]  = buf[pos+15] << decimation_shifts::pre32;
		intbuf[8]  = buf[pos+18] << decimation_shifts::pre32;
		intbuf[9]  = buf[pos+19] << decimation_shifts::pre32;
		intbuf[10] = buf[pos+22] << decimation_shifts::pre32;
		intbuf[11] = buf[pos+23] << decimation_shifts::pre32;
		intbuf[12] = buf[pos+26] << decimation_shifts::pre32;
		intbuf[13] = buf[pos+27] << decimation_shifts::pre32;
		intbuf[14] = buf[pos+30] << decimation_shifts::pre32;
		intbuf[15] = buf[pos+31] << decimation_shifts::pre32;
		intbuf[16] = buf[pos+34] << decimation_shifts::pre32;
		intbuf[17] = buf[pos+35] << decimation_shifts::pre32;
		intbuf[18] = buf[pos+38] << decimation_shifts::pre32;
		intbuf[19] = buf[pos+39] << decimation_shifts::pre32;
		intbuf[20] = buf[pos+42] << decimation_shifts::pre32;
		intbuf[21] = buf[pos+43] << decimation_shifts::pre32;
		intbuf[22] = buf[pos+46] << decimation_shifts::pre32;
		intbuf[23] = buf[pos+47] << decimation_shifts::pre32;
		intbuf[24] = buf[pos+50] << decimation_shifts::pre32;
		intbuf[25] = buf[pos+51] << decimation_shifts::pre32;
		intbuf[26] = buf[pos+54] << decimation_shifts::pre32;
		intbuf[27] = buf[pos+55] << decimation_shifts::pre32;
		intbuf[28] = buf[pos+58] << decimation_shifts::pre32;
		intbuf[29] = buf[pos+59] << decimation_shifts::pre32;
		intbuf[30] = buf[pos+62] << decimation_shifts::pre32;
		intbuf[31] = buf[pos+63] << decimation_shifts::pre32;
		m_decimator2.myDecimate(
				buf[pos+0] << decimation_shifts::pre32,
				buf[pos+1] << decimation_shifts::pre32,
				&intbuf[0],
				&intbuf[1]);
		m_decimator2.myDecimate(
				buf[pos+4] << decimation_shifts::pre32,
				buf[pos+5] << decimation_shifts::pre32,
				&intbuf[2],
				&intbuf[3]);
		m_decimator2.myDecimate(
				buf[pos+8] << decimation_shifts::pre32,
				buf[pos+9] << decimation_shifts::pre32,
				&intbuf[4],
				&intbuf[5]);
		m_decimator2.myDecimate(
				buf[pos+12] << decimation_shifts::pre32,
				buf[pos+13] << decimation_shifts::pre32,
				&intbuf[6],
				&intbuf[7]);
		m_decimator2.myDecimate(
				buf[pos+16] << decimation_shifts::pre32,
				buf[pos+17] << decimation_shifts::pre32,
				&intbuf[8],
				&intbuf[9]);
		m_decimator2.myDecimate(
				buf[pos+20] << decimation_shifts::pre32,
				buf[pos+21] << decimation_shifts::pre32,
				&intbuf[10],
				&intbuf[11]);
		m_decimator2.myDecimate(
				buf[pos+24] << decimation_shifts::pre32,
				buf[pos+25] << decimation_shifts::pre32,
				&intbuf[12],
				&intbuf[13]);
		m_decimator2.myDecimate(
				buf[pos+28] << decimation_shifts::pre32,
				buf[pos+29] << decimation_shifts::pre32,
				&intbuf[14],
				&intbuf[15]);
		m_decimator2.myDecimate(
				buf[pos+32] << decimation_shifts::pre32,
				buf[pos+33] << decimation_shifts::pre32,
				&intbuf[16],
				&intbuf[17]);
		m_decimator2.myDecimate(
				buf[pos+36] << decimation_shifts::pre32,
				buf[pos+37] << decimation_shifts::pre32,
				&intbuf[18],
				&intbuf[19]);
		m_decimator2.myDecimate(
				buf[pos+40] << decimation_shifts::pre32,
				buf[pos+41] << decimation_shifts::pre32,
				&intbuf[20],
				&intbuf[21]);
		m_decimator2.myDecimate(
				buf[pos+44] << decimation_shifts::pre32,
				buf[pos+45] << decimation_shifts::pre32,
				&intbuf[22],
				&intbuf[23]);
		m_decimator2.myDecimate(
				buf[pos+48] << decimation_shifts::pre32,
				buf[pos+49] << decimation_shifts::pre32,
				&intbuf[24],
				&intbuf[25]);
		m_decimator2.myDecimate(
				buf[pos+52] << decimation_shifts::pre32,
				buf[pos+53] << decimation_shifts::pre32,
				&intbuf[26],
				&intbuf[27]);
		m_decimator2.myDecimate(
				buf[pos+56] << decimation_shifts::pre32,
				buf[pos+57] << decimation_shifts::pre32,
				&intbuf[28],
				&intbuf[29]);
		m_decimator2.myDecimate(
				buf[pos+60] << decimation_shifts::pre32,
				buf[pos+61] << decimation_shifts::pre32,
				&intbuf[30],
				&intbuf[31]);
		m_decimator4.myDecimate(
				intbuf[0],
				intbuf[1],
				&intbuf[2],
				&intbuf[3]);
		m_decimator4.myDecimate(
				intbuf[4],
				intbuf[5],
				&intbuf[6],
				&intbuf[7]);
		m_decimator4.myDecimate(
				intbuf[8],
				intbuf[9],
				&intbuf[10],
				&intbuf[11]);
		m_decimator4.myDecimate(
				intbuf[12],
				intbuf[13],
				&intbuf[14],
				&intbuf[15]);
		m_decimator4.myDecimate(
				intbuf[16],
				intbuf[17],
				&intbuf[18],
				&intbuf[19]);
		m_decimator4.myDecimate(
				intbuf[20],
				intbuf[21],
				&intbuf[22],
				&intbuf[23]);
		m_decimator4.myDecimate(
				intbuf[24],
				intbuf[25],
				&intbuf[26],
				&intbuf[27]);
		m_decimator4.myDecimate(
				intbuf[28],
				intbuf[29],
				&intbuf[30],
				&intbuf[31]);
		m_decimator8.myDecimate(
				intbuf[2],
				intbuf[3],
				&intbuf[6],
				&intbuf[7]);
		m_decimator8.myDecimate(
				intbuf[10],
				intbuf[11],
				&intbuf[14],
				&intbuf[15]);
		m_decimator8.myDecimate(
				intbuf[18],
				intbuf[19],
				&intbuf[22],
				&intbuf[23]);
		m_decimator8.myDecimate(
				intbuf[26],
				intbuf[27],
				&intbuf[30],
				&intbuf[31]);
		m_decimator16.myDecimate(
				intbuf[6],
				intbuf[7],
				&intbuf[14],
				&intbuf[15]);
		m_decimator16.myDecimate(
				intbuf[22],
				intbuf[23],
				&intbuf[30],
				&intbuf[31]);
		m_decimator32.myDecimate(
				intbuf[14],
				intbuf[15],
				&intbuf[30],
				&intbuf[31]);
		(**it).setReal(intbuf[30] >> decimation_shifts::post32);
		(**it).setImag(intbuf[31] >> decimation_shifts::post32);
		fifo.bumpIndex(it);
	}
}
template
void SampleSinkFifoDecimator::decimate64_cen(SampleSinkFifoDoubleBuffered& fifo, const T* buf, qint32 len)
{
	qint32 intbuf[64];
	SampleVector::iterator it;
	fifo.getWriteIterator(it);
	for (int pos = 0; pos < len - 127; pos += 128)
	{
		intbuf[0]  = buf[pos+2] << decimation_shifts::pre64;
		intbuf[1]  = buf[pos+3] << decimation_shifts