WSJT-X/lib/qra/qracodes/pdmath.c

// pdmath.c
// Elementary math on probability distributions
// 
// (c) 2016 - Nico Palermo, IV3NWV - Microtelecom Srl, Italy
// ------------------------------------------------------------------------------
// This file is part of the qracodes project, a Forward Error Control
// encoding/decoding package based on Q-ary RA (Repeat and Accumulate) LDPC codes.
//
//    qracodes is free software: you can redistribute it and/or modify
//    it under the terms of the GNU General Public License as published by
//    the Free Software Foundation, either version 3 of the License, or
//    (at your option) any later version.
//    qracodes is distributed in the hope that it will be useful,
//    but WITHOUT ANY WARRANTY; without even the implied warranty of
//    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
//    GNU General Public License for more details.

//    You should have received a copy of the GNU General Public License
//    along with qracodes source distribution.  
//    If not, see <http://www.gnu.org/licenses/>.

#include "pdmath.h"

typedef const float *ppd_uniform;
typedef void  (*ppd_imul)(float*,const float*);
typedef float (*ppd_norm)(float*);

// define vector size in function of its logarithm in base 2
static const int pd_log2dim[7] = {
	1,2,4,8,16,32,64
};

// define uniform distributions of given size
static const float pd_uniform1[1] = {
	1.
};
static const float pd_uniform2[2] = {
	1./2., 1./2.
};
static const float pd_uniform4[4] = {
	1./4., 1./4.,1./4., 1./4.
};
static const float pd_uniform8[8] = {
	1./8., 1./8.,1./8., 1./8.,1./8., 1./8.,1./8., 1./8.
};
static const float pd_uniform16[16] = {
	1./16., 1./16., 1./16., 1./16.,1./16., 1./16.,1./16., 1./16.,
	1./16., 1./16., 1./16., 1./16.,1./16., 1./16.,1./16., 1./16.
};
static const float pd_uniform32[32] = {
	1./32., 1./32., 1./32., 1./32.,1./32., 1./32.,1./32., 1./32.,
	1./32., 1./32., 1./32., 1./32.,1./32., 1./32.,1./32., 1./32.,
	1./32., 1./32., 1./32., 1./32.,1./32., 1./32.,1./32., 1./32.,
	1./32., 1./32., 1./32., 1./32.,1./32., 1./32.,1./32., 1./32.
};
static const float pd_uniform64[64] = {
	1./64., 1./64., 1./64., 1./64.,1./64., 1./64.,1./64., 1./64.,
	1./64., 1./64., 1./64., 1./64.,1./64., 1./64.,1./64., 1./64.,
	1./64., 1./64., 1./64., 1./64.,1./64., 1./64.,1./64., 1./64.,
	1./64., 1./64., 1./64., 1./64.,1./64., 1./64.,1./64., 1./64.,
	1./64., 1./64., 1./64., 1./64.,1./64., 1./64.,1./64., 1./64.,
	1./64., 1./64., 1./64., 1./64.,1./64., 1./64.,1./64., 1./64.,
	1./64., 1./64., 1./64., 1./64.,1./64., 1./64.,1./64., 1./64.,
	1./64., 1./64., 1./64., 1./64.,1./64., 1./64.,1./64., 1./64.

};

static const ppd_uniform pd_uniform_tab[7] = {
	pd_uniform1,
	pd_uniform2,
	pd_uniform4,
	pd_uniform8,
	pd_uniform16,
	pd_uniform32,
	pd_uniform64
};

// returns a pointer to the uniform distribution of the given logsize
const float *pd_uniform(int nlogdim)
{
	return pd_uniform_tab[nlogdim];
}

// in-place multiplication functions
// compute dst = dst*src for any element of the distrib

static void pd_imul1(float *dst, const float *src)
{
		dst[0] *= src[0]; 
}

static void pd_imul2(float *dst, const float *src)
{
		dst[0] *= src[0]; dst[1] *= src[1]; 
}
static void pd_imul4(float *dst, const float *src)
{
		dst[0] *= src[0]; dst[1] *= src[1]; 
		dst[2] *= src[2]; dst[3] *= src[3]; 
}
static void pd_imul8(float *dst, const float *src)
{
		dst[0] *= src[0]; dst[1] *= src[1]; dst[2] *= src[2]; dst[3] *= src[3]; 
		dst[4] *= src[4]; dst[5] *= src[5]; dst[6] *= src[6]; dst[7] *= src[7]; 
}
static void pd_imul16(float *dst, const float *src)
{
		dst[0] *= src[0];  dst[1] *= src[1];  dst[2] *= src[2];  dst[3] *= src[3]; 
		dst[4] *= src[4];  dst[5] *= src[5];  dst[6] *= src[6];  dst[7] *= src[7]; 
		dst[8] *= src[8];  dst[9] *= src[9];  dst[10]*= src[10]; dst[11]*= src[11]; 
		dst[12]*= src[12]; dst[13]*= src[13]; dst[14]*= src[14]; dst[15]*= src[15]; 
}
static void pd_imul32(float *dst, const float *src)
{
	pd_imul16(dst,src);
	pd_imul16(dst+16,src+16);
}
static void pd_imul64(float *dst, const float *src)
{
	pd_imul16(dst, src);
	pd_imul16(dst+16, src+16);
	pd_imul16(dst+32, src+32);
	pd_imul16(dst+48, src+48);
}

static const ppd_imul pd_imul_tab[7] = {
	pd_imul1,
	pd_imul2,
	pd_imul4,
	pd_imul8,
	pd_imul16,
	pd_imul32,
	pd_imul64
};

// in place multiplication
// compute dst = dst*src for any element of the distrib give their log2 size
// arguments must be pointers to array of floats of the given size
void pd_imul(float *dst, const float *src, int nlogdim)
{
	pd_imul_tab[nlogdim](dst,src);
}

static float pd_norm1(float *ppd)
{
	float t = ppd[0];
	ppd[0] = 1.f;
	return t;
}

static float pd_norm2(float *ppd)
{
	float t,to;

	t =ppd[0]; t +=ppd[1];

	if (t<=0) {
		pd_init(ppd,pd_uniform(1),pd_log2dim[1]);
		return t;
		}

	to = t;
	t = 1.f/t;
	ppd[0] *=t; ppd[1] *=t; 
	return to;

}

static float pd_norm4(float *ppd)
{
	float t,to;

	t =ppd[0]; t +=ppd[1]; t +=ppd[2]; t +=ppd[3];

	if (t<=0) {
		pd_init(ppd,pd_uniform(2),pd_log2dim[2]);
		return t;
		}

	to = t;
	t = 1.f/t;
	ppd[0] *=t; ppd[1] *=t; ppd[2] *=t; ppd[3] *=t; 
	return to;
}

static float pd_norm8(float *ppd)
{
	float t,to;

	t  =ppd[0]; t +=ppd[1]; t +=ppd[2]; t +=ppd[3];
	t +=ppd[4]; t +=ppd[5]; t +=ppd[6]; t +=ppd[7];

	if (t<=0) {
		pd_init(ppd,pd_uniform(3),pd_log2dim[3]);
		return t;
		}

	to = t;
	t = 1.f/t;
	ppd[0] *=t; ppd[1] *=t; ppd[2] *=t; ppd[3] *=t; 
	ppd[4] *=t; ppd[5] *=t; ppd[6] *=t; ppd[7] *=t; 
	return to;
}
static float pd_norm16(float *ppd)
{
	float t,to;

	t  =ppd[0];  t +=ppd[1];  t +=ppd[2];  t +=ppd[3];
	t +=ppd[4];  t +=ppd[5];  t +=ppd[6];  t +=ppd[7];
	t +=ppd[8];  t +=ppd[9];  t +=ppd[10]; t +=ppd[11];
	t +=ppd[12]; t +=ppd[13]; t +=ppd[14]; t +=ppd[15];

	if (t<=0) {
		pd_init(ppd,pd_uniform(4),pd_log2dim[4]);
		return t;
		}

	to = t;
	t = 1.f/t;
	ppd[0]  *=t; ppd[1]  *=t; ppd[2]  *=t; ppd[3]  *=t; 
	ppd[4]  *=t; ppd[5]  *=t; ppd[6]  *=t; ppd[7]  *=t; 
	ppd[8]  *=t; ppd[9]  *=t; ppd[10] *=t; ppd[11] *=t; 
	ppd[12] *=t; ppd[13] *=t; ppd[14] *=t; ppd[15] *=t; 

	return to;
}
static float pd_norm32(float *ppd)
{
	float t,to;

	t  =ppd[0];  t +=ppd[1];  t +=ppd[2];  t +=ppd[3];
	t +=ppd[4];  t +=ppd[5];  t +=ppd[6];  t +=ppd[7];
	t +=ppd[8];  t +=ppd[9];  t +=ppd[10]; t +=ppd[11];
	t +=ppd[12]; t +=ppd[13]; t +=ppd[14]; t +=ppd[15];
	t +=ppd[16]; t +=ppd[17]; t +=ppd[18]; t +=ppd[19];
	t +=ppd[20]; t +=ppd[21]; t +=ppd[22]; t +=ppd[23];
	t +=ppd[24]; t +=ppd[25]; t +=ppd[26]; t +=ppd[27];
	t +=ppd[28]; t +=ppd[29]; t +=ppd[30]; t +=ppd[31];

	if (t<=0) {
		pd_init(ppd,pd_uniform(5),pd_log2dim[5]);
		return t;
		}

	to = t;
	t = 1.f/t;
	ppd[0]  *=t; ppd[1]  *=t; ppd[2]  *=t; ppd[3]  *=t; 
	ppd[4]  *=t; ppd[5]  *=t; ppd[6]  *=t; ppd[7]  *=t; 
	ppd[8]  *=t; ppd[9]  *=t; ppd[10] *=t; ppd[11] *=t; 
	ppd[12] *=t; ppd[13] *=t; ppd[14] *=t; ppd[15] *=t; 
	ppd[16] *=t; ppd[17] *=t; ppd[18] *=t; ppd[19] *=t; 
	ppd[20] *=t; ppd[21] *=t; ppd[22] *=t; ppd[23] *=t; 
	ppd[24] *=t; ppd[25] *=t; ppd[26] *=t; ppd[27] *=t; 
	ppd[28] *=t; ppd[29] *=t; ppd[30] *=t; ppd[31] *=t; 

	return to;
}

static float pd_norm64(float *ppd)
{
	float t,to;

	t  =ppd[0];  t +=ppd[1];  t +=ppd[2];  t +=ppd[3];
	t +=ppd[4];  t +=ppd[5];  t +=ppd[6];  t +=ppd[7];
	t +=ppd[8];  t +=ppd[9];  t +=ppd[10]; t +=ppd[11];
	t +=ppd[12]; t +=ppd[13]; t +=ppd[14]; t +=ppd[15];
	t +=ppd[16]; t +=ppd[17]; t +=ppd[18]; t +=ppd[19];
	t +=ppd[20]; t +=ppd[21]; t +=ppd[22]; t +=ppd[23];
	t +=ppd[24]; t +=ppd[25]; t +=ppd[26]; t +=ppd[27];
	t +=ppd[28]; t +=ppd[29]; t +=ppd[30]; t +=ppd[31];

	t +=ppd[32]; t +=ppd[33]; t +=ppd[34]; t +=ppd[35];
	t +=ppd[36]; t +=ppd[37]; t +=ppd[38]; t +=ppd[39];
	t +=ppd[40]; t +=ppd[41]; t +=ppd[42]; t +=ppd[43];
	t +=ppd[44]; t +=ppd[45]; t +=ppd[46]; t +=ppd[47];
	t +=ppd[48]; t +=ppd[49]; t +=ppd[50]; t +=ppd[51];
	t +=ppd[52]; t +=ppd[53]; t +=ppd[54]; t +=ppd[55];
	t +=ppd[56]; t +=ppd[57]; t +=ppd[58]; t +=ppd[59];
	t +=ppd[60]; t +=ppd[61]; t +=ppd[62]; t +=ppd[63];

	if (t<=0) {
		pd_init(ppd,pd_uniform(6),pd_log2dim[6]);
		return t;
		}

	to = t;
	t = 1.0f/t;
	ppd[0]  *=t; ppd[1]  *=t; ppd[2]  *=t; ppd[3]  *=t; 
	ppd[4]  *=t; ppd[5]  *=t; ppd[6]  *=t; ppd[7]  *=t; 
	ppd[8]  *=t; ppd[9]  *=t; ppd[10] *=t; ppd[11] *=t; 
	ppd[12] *=t; ppd[13] *=t; ppd[14] *=t; ppd[15] *=t; 
	ppd[16] *=t; ppd[17] *=t; ppd[18] *=t; ppd[19] *=t; 
	ppd[20] *=t; ppd[21] *=t; ppd[22] *=t; ppd[23] *=t; 
	ppd[24] *=t; ppd[25] *=t; ppd[26] *=t; ppd[27] *=t; 
	ppd[28] *=t; ppd[29] *=t; ppd[30] *=t; ppd[31] *=t; 

	ppd[32] *=t; ppd[33] *=t; ppd[34] *=t; ppd[35] *=t; 
	ppd[36] *=t; ppd[37] *=t; ppd[38] *=t; ppd[39] *=t; 
	ppd[40] *=t; ppd[41] *=t; ppd[42] *=t; ppd[43] *=t; 
	ppd[44] *=t; ppd[45] *=t; ppd[46] *=t; ppd[47] *=t; 
	ppd[48] *=t; ppd[49] *=t; ppd[50] *=t; ppd[51] *=t; 
	ppd[52] *=t; ppd[53] *=t; ppd[54] *=t; ppd[55] *=t; 
	ppd[56] *=t; ppd[57] *=t; ppd[58] *=t; ppd[59] *=t; 
	ppd[60] *=t; ppd[61] *=t; ppd[62] *=t; ppd[63] *=t; 

	return to;
}


static const ppd_norm pd_norm_tab[7] = {
	pd_norm1,
	pd_norm2,
	pd_norm4,
	pd_norm8,
	pd_norm16,
	pd_norm32,
	pd_norm64
};

float pd_norm(float *pd, int nlogdim)
{
	return pd_norm_tab[nlogdim](pd);
}

void pd_memset(float *dst, const float *src, int ndim, int nitems)
{
	int size = PD_SIZE(ndim);
	while(nitems--) {
		memcpy(dst,src,size);
		dst +=ndim;
		}
}

void  pd_fwdperm(float *dst, float *src, const  int *perm, int ndim)
{
	// TODO: non-loop implementation
	while (ndim--) 
		dst[ndim] = src[perm[ndim]];
}

void  pd_bwdperm(float *dst, float *src, const  int *perm, int ndim)
{
	// TODO: non-loop implementation
	while (ndim--) 
		dst[perm[ndim]] = src[ndim];
}

float pd_max(float *src, int ndim)
{
	// TODO: faster implementation

	float cmax=0;  // we assume that prob distributions are always positive
	float cval;

	while (ndim--) {
		cval = src[ndim];
		if (cval>=cmax) {
			cmax = cval;
			}
		}

	return cmax;
}

int pd_argmax(float *pmax, float *src, int ndim)
{
	// TODO: faster implementation

	float cmax=0;  // we assume that prob distributions are always positive
	float cval;
	int idxmax=-1; // indicates that all pd elements are <0

	while (ndim--) {
		cval = src[ndim];
		if (cval>=cmax) {
			cmax = cval;
			idxmax = ndim;
			}
		}

	if (pmax)
		*pmax = cmax;

	return idxmax;
}
Starting to add code for a potential "QRA65" mode. git-svn-id: svn+ssh://svn.code.sf.net/p/wsjt/wsjt/branches/wsjtx@6788 ab8295b8-cf94-4d9e-aec4-7959e3be5d79 2016-06-21 15:07:24 +00:00			`// pdmath.c`
			`// Elementary math on probability distributions`
			`//`
			`// (c) 2016 - Nico Palermo, IV3NWV - Microtelecom Srl, Italy`
			`// ------------------------------------------------------------------------------`
			`// This file is part of the qracodes project, a Forward Error Control`
			`// encoding/decoding package based on Q-ary RA (Repeat and Accumulate) LDPC codes.`
			`//`
			`// qracodes is free software: you can redistribute it and/or modify`
			`// it under the terms of the GNU General Public License as published by`
			`// the Free Software Foundation, either version 3 of the License, or`
			`// (at your option) any later version.`
			`// qracodes is distributed in the hope that it will be useful,`
			`// but WITHOUT ANY WARRANTY; without even the implied warranty of`
			`// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the`
			`// GNU General Public License for more details.`

			`// You should have received a copy of the GNU General Public License`
			`// along with qracodes source distribution.`
			`// If not, see <http://www.gnu.org/licenses/>.`

			`#include "pdmath.h"`

			`typedef const float *ppd_uniform;`
			`typedef void (ppd_imul)(float,const float*);`
			`typedef float (ppd_norm)(float);`

			`// define vector size in function of its logarithm in base 2`
			`static const int pd_log2dim[7] = {`
			`1,2,4,8,16,32,64`
			`};`

			`// define uniform distributions of given size`
			`static const float pd_uniform1[1] = {`
			`1.`
			`};`
			`static const float pd_uniform2[2] = {`
			`1./2., 1./2.`
			`};`
			`static const float pd_uniform4[4] = {`
			`1./4., 1./4.,1./4., 1./4.`
			`};`
			`static const float pd_uniform8[8] = {`
			`1./8., 1./8.,1./8., 1./8.,1./8., 1./8.,1./8., 1./8.`
			`};`
			`static const float pd_uniform16[16] = {`
			`1./16., 1./16., 1./16., 1./16.,1./16., 1./16.,1./16., 1./16.,`
			`1./16., 1./16., 1./16., 1./16.,1./16., 1./16.,1./16., 1./16.`
			`};`
			`static const float pd_uniform32[32] = {`
			`1./32., 1./32., 1./32., 1./32.,1./32., 1./32.,1./32., 1./32.,`
			`1./32., 1./32., 1./32., 1./32.,1./32., 1./32.,1./32., 1./32.,`
			`1./32., 1./32., 1./32., 1./32.,1./32., 1./32.,1./32., 1./32.,`
			`1./32., 1./32., 1./32., 1./32.,1./32., 1./32.,1./32., 1./32.`
			`};`
			`static const float pd_uniform64[64] = {`
			`1./64., 1./64., 1./64., 1./64.,1./64., 1./64.,1./64., 1./64.,`
			`1./64., 1./64., 1./64., 1./64.,1./64., 1./64.,1./64., 1./64.,`
			`1./64., 1./64., 1./64., 1./64.,1./64., 1./64.,1./64., 1./64.,`
			`1./64., 1./64., 1./64., 1./64.,1./64., 1./64.,1./64., 1./64.,`
			`1./64., 1./64., 1./64., 1./64.,1./64., 1./64.,1./64., 1./64.,`
			`1./64., 1./64., 1./64., 1./64.,1./64., 1./64.,1./64., 1./64.,`
			`1./64., 1./64., 1./64., 1./64.,1./64., 1./64.,1./64., 1./64.,`
			`1./64., 1./64., 1./64., 1./64.,1./64., 1./64.,1./64., 1./64.`

			`};`

			`static const ppd_uniform pd_uniform_tab[7] = {`
			`pd_uniform1,`
			`pd_uniform2,`
			`pd_uniform4,`
			`pd_uniform8,`
			`pd_uniform16,`
			`pd_uniform32,`
			`pd_uniform64`
			`};`

			`// returns a pointer to the uniform distribution of the given logsize`
			`const float *pd_uniform(int nlogdim)`
			`{`
			`return pd_uniform_tab[nlogdim];`
			`}`

			`// in-place multiplication functions`
			`// compute dst = dst*src for any element of the distrib`

			`static void pd_imul1(float dst, const float src)`
			`{`
			`dst[0] *= src[0];`
			`}`

			`static void pd_imul2(float dst, const float src)`
			`{`
			`dst[0] = src[0]; dst[1] = src[1];`
			`}`
			`static void pd_imul4(float dst, const float src)`
			`{`
			`dst[0] = src[0]; dst[1] = src[1];`
			`dst[2] = src[2]; dst[3] = src[3];`
			`}`
			`static void pd_imul8(float dst, const float src)`
			`{`
			`dst[0] = src[0]; dst[1] = src[1]; dst[2] = src[2]; dst[3] = src[3];`
			`dst[4] = src[4]; dst[5] = src[5]; dst[6] = src[6]; dst[7] = src[7];`
			`}`
			`static void pd_imul16(float dst, const float src)`
			`{`
			`dst[0] = src[0]; dst[1] = src[1]; dst[2] = src[2]; dst[3] = src[3];`
			`dst[4] = src[4]; dst[5] = src[5]; dst[6] = src[6]; dst[7] = src[7];`
			`dst[8] = src[8]; dst[9] = src[9]; dst[10]= src[10]; dst[11]= src[11];`
			`dst[12]= src[12]; dst[13]= src[13]; dst[14]= src[14]; dst[15]= src[15];`
			`}`
			`static void pd_imul32(float dst, const float src)`
			`{`
			`pd_imul16(dst,src);`
			`pd_imul16(dst+16,src+16);`
			`}`
			`static void pd_imul64(float dst, const float src)`
			`{`
			`pd_imul16(dst, src);`
			`pd_imul16(dst+16, src+16);`
			`pd_imul16(dst+32, src+32);`
			`pd_imul16(dst+48, src+48);`
			`}`

			`static const ppd_imul pd_imul_tab[7] = {`
			`pd_imul1,`
			`pd_imul2,`
			`pd_imul4,`
			`pd_imul8,`
			`pd_imul16,`
			`pd_imul32,`
			`pd_imul64`
			`};`

			`// in place multiplication`
			`// compute dst = dst*src for any element of the distrib give their log2 size`
			`// arguments must be pointers to array of floats of the given size`
			`void pd_imul(float dst, const float src, int nlogdim)`
			`{`
			`pd_imul_tab[nlogdim](dst,src);`
			`}`

			`static float pd_norm1(float *ppd)`
			`{`
			`float t = ppd[0];`
			`ppd[0] = 1.f;`
			`return t;`
			`}`

			`static float pd_norm2(float *ppd)`
			`{`
			`float t,to;`

			`t =ppd[0]; t +=ppd[1];`

			`if (t<=0) {`
			`pd_init(ppd,pd_uniform(1),pd_log2dim[1]);`
			`return t;`
			`}`

			`to = t;`
			`t = 1.f/t;`
			`ppd[0] =t; ppd[1] =t;`
			`return to;`

			`}`

			`static float pd_norm4(float *ppd)`
			`{`
			`float t,to;`

			`t =ppd[0]; t +=ppd[1]; t +=ppd[2]; t +=ppd[3];`

			`if (t<=0) {`
			`pd_init(ppd,pd_uniform(2),pd_log2dim[2]);`
			`return t;`
			`}`

			`to = t;`
			`t = 1.f/t;`
			`ppd[0] =t; ppd[1] =t; ppd[2] =t; ppd[3] =t;`
			`return to;`
			`}`

			`static float pd_norm8(float *ppd)`
			`{`
			`float t,to;`

			`t =ppd[0]; t +=ppd[1]; t +=ppd[2]; t +=ppd[3];`
			`t +=ppd[4]; t +=ppd[5]; t +=ppd[6]; t +=ppd[7];`

			`if (t<=0) {`
			`pd_init(ppd,pd_uniform(3),pd_log2dim[3]);`
			`return t;`
			`}`

			`to = t;`
			`t = 1.f/t;`
			`ppd[0] =t; ppd[1] =t; ppd[2] =t; ppd[3] =t;`
			`ppd[4] =t; ppd[5] =t; ppd[6] =t; ppd[7] =t;`
			`return to;`
			`}`
			`static float pd_norm16(float *ppd)`
			`{`
			`float t,to;`

			`t =ppd[0]; t +=ppd[1]; t +=ppd[2]; t +=ppd[3];`
			`t +=ppd[4]; t +=ppd[5]; t +=ppd[6]; t +=ppd[7];`
			`t +=ppd[8]; t +=ppd[9]; t +=ppd[10]; t +=ppd[11];`
			`t +=ppd[12]; t +=ppd[13]; t +=ppd[14]; t +=ppd[15];`

			`if (t<=0) {`
			`pd_init(ppd,pd_uniform(4),pd_log2dim[4]);`
			`return t;`
			`}`

			`to = t;`
			`t = 1.f/t;`
			`ppd[0] =t; ppd[1] =t; ppd[2] =t; ppd[3] =t;`
			`ppd[4] =t; ppd[5] =t; ppd[6] =t; ppd[7] =t;`
			`ppd[8] =t; ppd[9] =t; ppd[10] =t; ppd[11] =t;`
			`ppd[12] =t; ppd[13] =t; ppd[14] =t; ppd[15] =t;`

			`return to;`
			`}`
			`static float pd_norm32(float *ppd)`
			`{`
			`float t,to;`

			`t =ppd[0]; t +=ppd[1]; t +=ppd[2]; t +=ppd[3];`
			`t +=ppd[4]; t +=ppd[5]; t +=ppd[6]; t +=ppd[7];`
			`t +=ppd[8]; t +=ppd[9]; t +=ppd[10]; t +=ppd[11];`
			`t +=ppd[12]; t +=ppd[13]; t +=ppd[14]; t +=ppd[15];`
			`t +=ppd[16]; t +=ppd[17]; t +=ppd[18]; t +=ppd[19];`
			`t +=ppd[20]; t +=ppd[21]; t +=ppd[22]; t +=ppd[23];`
			`t +=ppd[24]; t +=ppd[25]; t +=ppd[26]; t +=ppd[27];`
			`t +=ppd[28]; t +=ppd[29]; t +=ppd[30]; t +=ppd[31];`

			`if (t<=0) {`
			`pd_init(ppd,pd_uniform(5),pd_log2dim[5]);`
			`return t;`
			`}`

			`to = t;`
			`t = 1.f/t;`
			`ppd[0] =t; ppd[1] =t; ppd[2] =t; ppd[3] =t;`
			`ppd[4] =t; ppd[5] =t; ppd[6] =t; ppd[7] =t;`
			`ppd[8] =t; ppd[9] =t; ppd[10] =t; ppd[11] =t;`
			`ppd[12] =t; ppd[13] =t; ppd[14] =t; ppd[15] =t;`
			`ppd[16] =t; ppd[17] =t; ppd[18] =t; ppd[19] =t;`
			`ppd[20] =t; ppd[21] =t; ppd[22] =t; ppd[23] =t;`
			`ppd[24] =t; ppd[25] =t; ppd[26] =t; ppd[27] =t;`
			`ppd[28] =t; ppd[29] =t; ppd[30] =t; ppd[31] =t;`

			`return to;`
			`}`

			`static float pd_norm64(float *ppd)`
			`{`
			`float t,to;`

			`t =ppd[0]; t +=ppd[1]; t +=ppd[2]; t +=ppd[3];`
			`t +=ppd[4]; t +=ppd[5]; t +=ppd[6]; t +=ppd[7];`
			`t +=ppd[8]; t +=ppd[9]; t +=ppd[10]; t +=ppd[11];`
			`t +=ppd[12]; t +=ppd[13]; t +=ppd[14]; t +=ppd[15];`
			`t +=ppd[16]; t +=ppd[17]; t +=ppd[18]; t +=ppd[19];`
			`t +=ppd[20]; t +=ppd[21]; t +=ppd[22]; t +=ppd[23];`
			`t +=ppd[24]; t +=ppd[25]; t +=ppd[26]; t +=ppd[27];`
			`t +=ppd[28]; t +=ppd[29]; t +=ppd[30]; t +=ppd[31];`

			`t +=ppd[32]; t +=ppd[33]; t +=ppd[34]; t +=ppd[35];`
			`t +=ppd[36]; t +=ppd[37]; t +=ppd[38]; t +=ppd[39];`
			`t +=ppd[40]; t +=ppd[41]; t +=ppd[42]; t +=ppd[43];`
			`t +=ppd[44]; t +=ppd[45]; t +=ppd[46]; t +=ppd[47];`
			`t +=ppd[48]; t +=ppd[49]; t +=ppd[50]; t +=ppd[51];`
			`t +=ppd[52]; t +=ppd[53]; t +=ppd[54]; t +=ppd[55];`
			`t +=ppd[56]; t +=ppd[57]; t +=ppd[58]; t +=ppd[59];`
			`t +=ppd[60]; t +=ppd[61]; t +=ppd[62]; t +=ppd[63];`

			`if (t<=0) {`
			`pd_init(ppd,pd_uniform(6),pd_log2dim[6]);`
			`return t;`
			`}`

			`to = t;`
			`t = 1.0f/t;`
			`ppd[0] =t; ppd[1] =t; ppd[2] =t; ppd[3] =t;`
			`ppd[4] =t; ppd[5] =t; ppd[6] =t; ppd[7] =t;`
			`ppd[8] =t; ppd[9] =t; ppd[10] =t; ppd[11] =t;`
			`ppd[12] =t; ppd[13] =t; ppd[14] =t; ppd[15] =t;`
			`ppd[16] =t; ppd[17] =t; ppd[18] =t; ppd[19] =t;`
			`ppd[20] =t; ppd[21] =t; ppd[22] =t; ppd[23] =t;`
			`ppd[24] =t; ppd[25] =t; ppd[26] =t; ppd[27] =t;`
			`ppd[28] =t; ppd[29] =t; ppd[30] =t; ppd[31] =t;`

			`ppd[32] =t; ppd[33] =t; ppd[34] =t; ppd[35] =t;`
			`ppd[36] =t; ppd[37] =t; ppd[38] =t; ppd[39] =t;`
			`ppd[40] =t; ppd[41] =t; ppd[42] =t; ppd[43] =t;`
			`ppd[44] =t; ppd[45] =t; ppd[46] =t; ppd[47] =t;`
			`ppd[48] =t; ppd[49] =t; ppd[50] =t; ppd[51] =t;`
			`ppd[52] =t; ppd[53] =t; ppd[54] =t; ppd[55] =t;`
			`ppd[56] =t; ppd[57] =t; ppd[58] =t; ppd[59] =t;`
			`ppd[60] =t; ppd[61] =t; ppd[62] =t; ppd[63] =t;`

			`return to;`
			`}`


			`static const ppd_norm pd_norm_tab[7] = {`
			`pd_norm1,`
			`pd_norm2,`
			`pd_norm4,`
			`pd_norm8,`
			`pd_norm16,`
			`pd_norm32,`
			`pd_norm64`
			`};`

			`float pd_norm(float *pd, int nlogdim)`
			`{`
			`return pd_norm_tab[nlogdim](pd);`
			`}`

			`void pd_memset(float dst, const float src, int ndim, int nitems)`
			`{`
			`int size = PD_SIZE(ndim);`
			`while(nitems--) {`
			`memcpy(dst,src,size);`
			`dst +=ndim;`
			`}`
			`}`

Apply Nico's QRA changes as of 2016/06/23 git-svn-id: svn+ssh://svn.code.sf.net/p/wsjt/wsjt/branches/wsjtx@6801 ab8295b8-cf94-4d9e-aec4-7959e3be5d79 2016-06-23 10:36:18 +00:00			`void pd_fwdperm(float dst, float src, const int *perm, int ndim)`
Starting to add code for a potential "QRA65" mode. git-svn-id: svn+ssh://svn.code.sf.net/p/wsjt/wsjt/branches/wsjtx@6788 ab8295b8-cf94-4d9e-aec4-7959e3be5d79 2016-06-21 15:07:24 +00:00			`{`
			`// TODO: non-loop implementation`
			`while (ndim--)`
			`dst[ndim] = src[perm[ndim]];`
			`}`

Apply Nico's QRA changes as of 2016/06/23 git-svn-id: svn+ssh://svn.code.sf.net/p/wsjt/wsjt/branches/wsjtx@6801 ab8295b8-cf94-4d9e-aec4-7959e3be5d79 2016-06-23 10:36:18 +00:00			`void pd_bwdperm(float dst, float src, const int *perm, int ndim)`
Starting to add code for a potential "QRA65" mode. git-svn-id: svn+ssh://svn.code.sf.net/p/wsjt/wsjt/branches/wsjtx@6788 ab8295b8-cf94-4d9e-aec4-7959e3be5d79 2016-06-21 15:07:24 +00:00			`{`
			`// TODO: non-loop implementation`
			`while (ndim--)`
			`dst[perm[ndim]] = src[ndim];`
			`}`

			`float pd_max(float *src, int ndim)`
			`{`
			`// TODO: faster implementation`

			`float cmax=0; // we assume that prob distributions are always positive`
			`float cval;`

			`while (ndim--) {`
			`cval = src[ndim];`
			`if (cval>=cmax) {`
			`cmax = cval;`
			`}`
			`}`

			`return cmax;`
			`}`

			`int pd_argmax(float pmax, float src, int ndim)`
			`{`
			`// TODO: faster implementation`

			`float cmax=0; // we assume that prob distributions are always positive`
			`float cval;`
			`int idxmax=-1; // indicates that all pd elements are <0`

			`while (ndim--) {`
			`cval = src[ndim];`
			`if (cval>=cmax) {`
			`cmax = cval;`
			`idxmax = ndim;`
			`}`
			`}`

			`if (pmax)`
			`*pmax = cmax;`

			`return idxmax;`
			`}`