1 files changed, 2100 insertions, 0 deletions
diff --git a/src/libmpg123/layer3.c b/src/libmpg123/layer3.c
new file mode 100755
index 0000000..c7cb8cd
--- /dev/null
+++ b/src/libmpg123/layer3.c
@@ -0,0 +1,2100 @@
+
+/* 
+ * Mpeg Layer-3 audio decoder 
+ * --------------------------
+ * copyright (c) 1995-1999 by Michael Hipp.
+ * All rights reserved. See also 'README'
+ *
+ * Optimize-TODO: put short bands into the band-field without the stride of 3 reals
+ * Length-optimze: unify long and short band code where it is possible
+ */
+
+#include <stdlib.h>
+#include "mpg123.h"
+#include "huffman.h"
+
+#include "getbits.h"
+
+static real ispow[8207];
+static real aa_ca[8], aa_cs[8];
+static real COS1[12][6];
+static real win[4][36];
+static real win1[4][36];
+static real gainpow2[256 + 118 + 4];
+real COS9[9];
+static real COS6_1, COS6_2;
+real tfcos36[9];
+static real tfcos12[3];
+#define NEW_DCT9
+#ifdef NEW_DCT9
+static real cos9[3], cos18[3];
+#endif
+
+struct bandInfoStruct
+{
+	int longIdx[23];
+	int longDiff[22];
+	int shortIdx[14];
+	int shortDiff[13];
+};
+
+int longLimit[9][23];
+int shortLimit[9][14];
+
+/* Used by the getbits macros */
+static unsigned long rval;
+static unsigned char rval_uc;
+
+struct bandInfoStruct bandInfo[9] =
+{
+/* MPEG 1.0 */
+ { {0,4,8,12,16,20,24,30,36,44,52,62,74, 90,110,134,162,196,238,288,342,418,576},
+   {4,4,4,4,4,4,6,6,8, 8,10,12,16,20,24,28,34,42,50,54, 76,158},
+   {0,4*3,8*3,12*3,16*3,22*3,30*3,40*3,52*3,66*3, 84*3,106*3,136*3,192*3},
+   {4,4,4,4,6,8,10,12,14,18,22,30,56} } ,
+
+ { {0,4,8,12,16,20,24,30,36,42,50,60,72, 88,106,128,156,190,230,276,330,384,576},
+   {4,4,4,4,4,4,6,6,6, 8,10,12,16,18,22,28,34,40,46,54, 54,192},
+   {0,4*3,8*3,12*3,16*3,22*3,28*3,38*3,50*3,64*3, 80*3,100*3,126*3,192*3},
+   {4,4,4,4,6,6,10,12,14,16,20,26,66} } ,
+
+ { {0,4,8,12,16,20,24,30,36,44,54,66,82,102,126,156,194,240,296,364,448,550,576} ,
+   {4,4,4,4,4,4,6,6,8,10,12,16,20,24,30,38,46,56,68,84,102, 26} ,
+   {0,4*3,8*3,12*3,16*3,22*3,30*3,42*3,58*3,78*3,104*3,138*3,180*3,192*3} ,
+   {4,4,4,4,6,8,12,16,20,26,34,42,12} }  ,
+
+/* MPEG 2.0 */
+ { {0,6,12,18,24,30,36,44,54,66,80,96,116,140,168,200,238,284,336,396,464,522,576},
+   {6,6,6,6,6,6,8,10,12,14,16,20,24,28,32,38,46,52,60,68,58,54 } ,
+   {0,4*3,8*3,12*3,18*3,24*3,32*3,42*3,56*3,74*3,100*3,132*3,174*3,192*3} ,
+   {4,4,4,6,6,8,10,14,18,26,32,42,18 } } ,
+/*
+ { {0,6,12,18,24,30,36,44,54,66,80,96,114,136,162,194,232,278,330,394,464,540,576},
+   {6,6,6,6,6,6,8,10,12,14,16,18,22,26,32,38,46,52,64,70,76,36 } ,
+*/
+/* changed 19th value fropm 330 to 332 */
+ { {0,6,12,18,24,30,36,44,54,66,80,96,114,136,162,194,232,278,332,394,464,540,576},
+   {6,6,6,6,6,6,8,10,12,14,16,18,22,26,32,38,46,54,62,70,76,36 } ,
+   {0,4*3,8*3,12*3,18*3,26*3,36*3,48*3,62*3,80*3,104*3,136*3,180*3,192*3} ,
+   {4,4,4,6,8,10,12,14,18,24,32,44,12 } } ,
+
+ { {0,6,12,18,24,30,36,44,54,66,80,96,116,140,168,200,238,284,336,396,464,522,576},
+   {6,6,6,6,6,6,8,10,12,14,16,20,24,28,32,38,46,52,60,68,58,54 },
+   {0,4*3,8*3,12*3,18*3,26*3,36*3,48*3,62*3,80*3,104*3,134*3,174*3,192*3},
+   {4,4,4,6,8,10,12,14,18,24,30,40,18 } } ,
+/* MPEG 2.5 */
+ { {0,6,12,18,24,30,36,44,54,66,80,96,116,140,168,200,238,284,336,396,464,522,576} ,
+   {6,6,6,6,6,6,8,10,12,14,16,20,24,28,32,38,46,52,60,68,58,54},
+   {0,12,24,36,54,78,108,144,186,240,312,402,522,576},
+   {4,4,4,6,8,10,12,14,18,24,30,40,18} },
+ { {0,6,12,18,24,30,36,44,54,66,80,96,116,140,168,200,238,284,336,396,464,522,576} ,
+   {6,6,6,6,6,6,8,10,12,14,16,20,24,28,32,38,46,52,60,68,58,54},
+   {0,12,24,36,54,78,108,144,186,240,312,402,522,576},
+   {4,4,4,6,8,10,12,14,18,24,30,40,18} },
+ { {0,12,24,36,48,60,72,88,108,132,160,192,232,280,336,400,476,566,568,570,572,574,576},
+   {12,12,12,12,12,12,16,20,24,28,32,40,48,56,64,76,90,2,2,2,2,2},
+   {0, 24, 48, 72,108,156,216,288,372,480,486,492,498,576},
+   {8,8,8,12,16,20,24,28,36,2,2,2,26} } ,
+};
+
+static int mapbuf0[9][152];
+static int mapbuf1[9][156];
+static int mapbuf2[9][44];
+static int *map[9][3];
+static int *mapend[9][3];
+
+static unsigned int n_slen2[512];	/* MPEG 2.0 slen for 'normal' mode */
+static unsigned int i_slen2[256];	/* MPEG 2.0 slen for intensity stereo */
+
+static real tan1_1[16], tan2_1[16], tan1_2[16], tan2_2[16];
+static real pow1_1[2][16], pow2_1[2][16], pow1_2[2][16], pow2_2[2][16];
+
+/* 
+ * init tables for layer-3 
+ */
+void mpg123_init_layer3(int down_sample_sblimit)
+{
+	int i, j, k, l;
+
+	for (i = -256; i < 118 + 4; i++)
+		gainpow2[i + 256] = pow((double) 2.0, -0.25 * (double) (i + 210));
+
+	for (i = 0; i < 8207; i++)
+		ispow[i] = pow((double) i, (double) 4.0 / 3.0);
+
+	for (i = 0; i < 8; i++)
+	{
+		static double Ci[8] =
+		{-0.6, -0.535, -0.33, -0.185, -0.095, -0.041, -0.0142, -0.0037};
+		double sq = sqrt(1.0 + Ci[i] * Ci[i]);
+
+		aa_cs[i] = 1.0 / sq;
+		aa_ca[i] = Ci[i] / sq;
+	}
+
+	for (i = 0; i < 18; i++)
+	{
+		win[0][i] = win[1][i] = 0.5 * sin(M_PI / 72.0 * (double) (2 * (i + 0) + 1)) / cos(M_PI * (double) (2 * (i + 0) + 19) / 72.0);
+		win[0][i + 18] = win[3][i + 18] = 0.5 * sin(M_PI / 72.0 * (double) (2 * (i + 18) + 1)) / cos(M_PI * (double) (2 * (i + 18) + 19) / 72.0);
+	}
+	for (i = 0; i < 6; i++)
+	{
+		win[1][i + 18] = 0.5 / cos(M_PI * (double) (2 * (i + 18) + 19) / 72.0);
+		win[3][i + 12] = 0.5 / cos(M_PI * (double) (2 * (i + 12) + 19) / 72.0);
+		win[1][i + 24] = 0.5 * sin(M_PI / 24.0 * (double) (2 * i + 13)) / cos(M_PI * (double) (2 * (i + 24) + 19) / 72.0);
+		win[1][i + 30] = win[3][i] = 0.0;
+		win[3][i + 6] = 0.5 * sin(M_PI / 24.0 * (double) (2 * i + 1)) / cos(M_PI * (double) (2 * (i + 6) + 19) / 72.0);
+	}
+
+	for (i = 0; i < 9; i++)
+		COS9[i] = cos(M_PI / 18.0 * (double) i);
+
+	for (i = 0; i < 9; i++)
+		tfcos36[i] = 0.5 / cos(M_PI * (double) (i * 2 + 1) / 36.0);
+	for (i = 0; i < 3; i++)
+		tfcos12[i] = 0.5 / cos(M_PI * (double) (i * 2 + 1) / 12.0);
+
+	COS6_1 = cos(M_PI / 6.0 * (double) 1);
+	COS6_2 = cos(M_PI / 6.0 * (double) 2);
+
+#ifdef NEW_DCT9
+	cos9[0] = cos(1.0 * M_PI / 9.0);
+	cos9[1] = cos(5.0 * M_PI / 9.0);
+	cos9[2] = cos(7.0 * M_PI / 9.0);
+	cos18[0] = cos(1.0 * M_PI / 18.0);
+	cos18[1] = cos(11.0 * M_PI / 18.0);
+	cos18[2] = cos(13.0 * M_PI / 18.0);
+#endif
+
+	for (i = 0; i < 12; i++)
+	{
+		win[2][i] = 0.5 * sin(M_PI / 24.0 * (double) (2 * i + 1)) / cos(M_PI * (double) (2 * i + 7) / 24.0);
+		for (j = 0; j < 6; j++)
+			COS1[i][j] = cos(M_PI / 24.0 * (double) ((2 * i + 7) * (2 * j + 1)));
+	}
+
+	for (j = 0; j < 4; j++)
+	{
+		static int len[4] = { 36, 36, 12, 36 };
+
+		for (i = 0; i < len[j]; i += 2)
+			win1[j][i] = +win[j][i];
+		for (i = 1; i < len[j]; i += 2)
+			win1[j][i] = -win[j][i];
+	}
+
+	for (i = 0; i < 16; i++)
+	{
+		double t = tan((double) i * M_PI / 12.0);
+
+		tan1_1[i] = t / (1.0 + t);
+		tan2_1[i] = 1.0 / (1.0 + t);
+		tan1_2[i] = M_SQRT2 * t / (1.0 + t);
+		tan2_2[i] = M_SQRT2 / (1.0 + t);
+
+		for (j = 0; j < 2; j++)
+		{
+			double base = pow(2.0, -0.25 * (j + 1.0));
+			double p1 = 1.0, p2 = 1.0;
+
+			if (i > 0)
+			{
+				if (i & 1)
+					p1 = pow(base, (i + 1.0) * 0.5);
+				else
+					p2 = pow(base, i * 0.5);
+			}
+			pow1_1[j][i] = p1;
+			pow2_1[j][i] = p2;
+			pow1_2[j][i] = M_SQRT2 * p1;
+			pow2_2[j][i] = M_SQRT2 * p2;
+		}
+	}
+
+	for (j = 0; j < 9; j++)
+	{
+		struct bandInfoStruct *bi = &bandInfo[j];
+		int *mp;
+		int cb, lwin;
+		int *bdf;
+
+		mp = map[j][0] = mapbuf0[j];
+		bdf = bi->longDiff;
+		for (i = 0, cb = 0; cb < 8; cb++, i += *bdf++)
+		{
+			*mp++ = (*bdf) >> 1;
+			*mp++ = i;
+			*mp++ = 3;
+			*mp++ = cb;
+		}
+		bdf = bi->shortDiff + 3;
+		for (cb = 3; cb < 13; cb++)
+		{
+			int l = (*bdf++) >> 1;
+
+			for (lwin = 0; lwin < 3; lwin++)
+			{
+				*mp++ = l;
+				*mp++ = i + lwin;
+				*mp++ = lwin;
+				*mp++ = cb;
+			}
+			i += 6 * l;
+		}
+		mapend[j][0] = mp;
+
+		mp = map[j][1] = mapbuf1[j];
+		bdf = bi->shortDiff + 0;
+		for (i = 0, cb = 0; cb < 13; cb++)
+		{
+			int l = (*bdf++) >> 1;
+
+			for (lwin = 0; lwin < 3; lwin++)
+			{
+				*mp++ = l;
+				*mp++ = i + lwin;
+				*mp++ = lwin;
+				*mp++ = cb;
+			}
+			i += 6 * l;
+		}
+		mapend[j][1] = mp;
+
+		mp = map[j][2] = mapbuf2[j];
+		bdf = bi->longDiff;
+		for (cb = 0; cb < 22; cb++)
+		{
+			*mp++ = (*bdf++) >> 1;
+			*mp++ = cb;
+		}
+		mapend[j][2] = mp;
+
+	}
+
+	for (j = 0; j < 9; j++)
+	{
+		for (i = 0; i < 23; i++)
+		{
+			longLimit[j][i] = (bandInfo[j].longIdx[i] - 1 + 8) / 18 + 1;
+			if (longLimit[j][i] > (down_sample_sblimit))
+				longLimit[j][i] = down_sample_sblimit;
+		}
+		for (i = 0; i < 14; i++)
+		{
+			shortLimit[j][i] = (bandInfo[j].shortIdx[i] - 1) / 18 + 1;
+			if (shortLimit[j][i] > (down_sample_sblimit))
+				shortLimit[j][i] = down_sample_sblimit;
+		}
+	}
+
+	for (i = 0; i < 5; i++)
+	{
+		for (j = 0; j < 6; j++)
+		{
+			for (k = 0; k < 6; k++)
+			{
+				int n = k + j * 6 + i * 36;
+
+				i_slen2[n] = i | (j << 3) | (k << 6) | (3 << 12);
+			}
+		}
+	}
+	for (i = 0; i < 4; i++)
+	{
+		for (j = 0; j < 4; j++)
+		{
+			for (k = 0; k < 4; k++)
+			{
+				int n = k + j * 4 + i * 16;
+
+				i_slen2[n + 180] = i | (j << 3) | (k << 6) | (4 << 12);
+			}
+		}
+	}
+	for (i = 0; i < 4; i++)
+	{
+		for (j = 0; j < 3; j++)
+		{
+			int n = j + i * 3;
+
+			i_slen2[n + 244] = i | (j << 3) | (5 << 12);
+			n_slen2[n + 500] = i | (j << 3) | (2 << 12) | (1 << 15);
+		}
+	}
+
+	for (i = 0; i < 5; i++)
+	{
+		for (j = 0; j < 5; j++)
+		{
+			for (k = 0; k < 4; k++)
+			{
+				for (l = 0; l < 4; l++)
+				{
+					int n = l + k * 4 + j * 16 + i * 80;
+
+					n_slen2[n] = i | (j << 3) | (k << 6) | (l << 9) | (0 << 12);
+				}
+			}
+		}
+	}
+	for (i = 0; i < 5; i++)
+	{
+		for (j = 0; j < 5; j++)
+		{
+			for (k = 0; k < 4; k++)
+			{
+				int n = k + j * 4 + i * 20;
+
+				n_slen2[n + 400] = i | (j << 3) | (k << 6) | (1 << 12);
+			}
+		}
+	}
+}
+
+/*
+ * read additional side information (for MPEG 1 and MPEG 2)
+ */
+static int III_get_side_info(struct III_sideinfo *si, int stereo,
+			      int ms_stereo, long sfreq, int single, int lsf)
+{
+	int ch, gr;
+	int powdiff = (single == 3) ? 4 : 0;
+
+	static const int tabs[2][5] = { {2, 9, 5, 3, 4}, {1, 8, 1, 2, 9} };
+	const int *tab = tabs[lsf];
+
+	si->main_data_begin = mpg123_getbits(tab[1]);
+	if (stereo == 1)
+		si->private_bits = mpg123_getbits_fast(tab[2]);
+	else
+		si->private_bits = mpg123_getbits_fast(tab[3]);
+
+	if (!lsf)
+	{
+		for (ch = 0; ch < stereo; ch++)
+		{
+			si->ch[ch].gr[0].scfsi = -1;
+			si->ch[ch].gr[1].scfsi = mpg123_getbits_fast(4);
+		}
+	}
+
+	for (gr = 0; gr < tab[0]; gr++)
+	{
+		for (ch = 0; ch < stereo; ch++)
+		{
+			register struct gr_info_s *gr_info = &(si->ch[ch].gr[gr]);
+
+			gr_info->part2_3_length = mpg123_getbits(12);
+			gr_info->big_values = mpg123_getbits(9);
+			if (gr_info->big_values > 288)
+			{
+				/*  fprintf(stderr, "big_values too large!\n"); */
+				/*  gr_info->big_values = 288; */
+				return 0;
+			}
+			gr_info->pow2gain = gainpow2 + 256 - mpg123_getbits_fast(8) + powdiff;
+			if (ms_stereo)
+				gr_info->pow2gain += 2;
+			gr_info->scalefac_compress = mpg123_getbits(tab[4]);
+
+			if (mpg123_get1bit())
+			{	/* window switch flag  */
+				int i;
+
+				gr_info->block_type = mpg123_getbits_fast(2);
+				gr_info->mixed_block_flag = mpg123_get1bit();
+				gr_info->table_select[0] = mpg123_getbits_fast(5);
+				gr_info->table_select[1] = mpg123_getbits_fast(5);
+				/*
+				 * table_select[2] not needed, because
+				 * there is no region2, but to satisfy
+				 * some verifications tools we set it
+				 * either.
+				 */
+				gr_info->table_select[2] = 0;
+				for (i = 0; i < 3; i++)
+					gr_info->full_gain[i] = gr_info->pow2gain + (mpg123_getbits_fast(3) << 3);
+
+				if (gr_info->block_type == 0)
+				{
+					/*  fprintf(stderr,	"Blocktype == 0 and window-switching == 1 not allowed.\n"); */
+					/*  exit(1); */
+					return 0;
+				}
+
+				/* region_count/start parameters are implicit in this case. */
+				if (!lsf || gr_info->block_type == 2)
+					gr_info->region1start = 36 >> 1;
+				else
+				{
+					/* check this again for 2.5 and sfreq=8 */
+					if (sfreq == 8)
+						gr_info->region1start =	108 >> 1;
+					else
+						gr_info->region1start =	54 >> 1;
+				}
+				gr_info->region2start = 576 >> 1;
+			}
+			else
+			{
+				int i, r0c, r1c;
+
+				for (i = 0; i < 3; i++)
+					gr_info->table_select[i] = mpg123_getbits_fast(5);
+				r0c = mpg123_getbits_fast(4);
+				r1c = mpg123_getbits_fast(3);
+				gr_info->region1start = bandInfo[sfreq].longIdx[r0c + 1] >> 1;
+				if (r0c + r1c + 2 > 22)
+					gr_info->region2start = 576 >> 1;
+				else
+					gr_info->region2start = bandInfo[sfreq].longIdx[r0c + 1 + r1c + 1] >> 1;
+				gr_info->block_type = 0;
+				gr_info->mixed_block_flag = 0;
+			}
+			if (!lsf)
+				gr_info->preflag = mpg123_get1bit();
+			gr_info->scalefac_scale = mpg123_get1bit();
+			gr_info->count1table_select = mpg123_get1bit();
+		}
+	}
+	return 1;
+}
+
+
+/*
+ * read scalefactors
+ */
+static int III_get_scale_factors_1(int *scf, struct gr_info_s *gr_info)
+{
+	static const unsigned char slen[2][16] = {
+		{0, 0, 0, 0, 3, 1, 1, 1, 2, 2, 2, 3, 3, 3, 4, 4},
+		{0, 1, 2, 3, 0, 1, 2, 3, 1, 2, 3, 1, 2, 3, 2, 3}
+	};
+	int numbits;
+	int num0 = slen[0][gr_info->scalefac_compress];
+	int num1 = slen[1][gr_info->scalefac_compress];
+
+	if (gr_info->block_type == 2)
+	{
+		int i = 18;
+
+		numbits = (num0 + num1) * 18;
+
+		if (gr_info->mixed_block_flag)
+		{
+			for (i = 8; i; i--)
+				*scf++ = mpg123_getbits_fast(num0);
+			i = 9;
+			numbits -= num0;	/* num0 * 17 + num1 * 18 */
+		}
+
+		for (; i; i--)
+			*scf++ = mpg123_getbits_fast(num0);
+		for (i = 18; i; i--)
+			*scf++ = mpg123_getbits_fast(num1);
+		*scf++ = 0;
+		*scf++ = 0;
+		*scf++ = 0;	/* short[13][0..2] = 0 */
+	}
+	else
+	{
+		int i;
+		int scfsi = gr_info->scfsi;
+
+		if (scfsi < 0)
+		{		/* scfsi < 0 => granule == 0 */
+			for (i = 11; i; i--)
+				*scf++ = mpg123_getbits_fast(num0);
+			for (i = 10; i; i--)
+				*scf++ = mpg123_getbits_fast(num1);
+			numbits = (num0 + num1) * 10 + num0;
+			*scf++ = 0;
+		}
+		else
+		{
+			numbits = 0;
+			if (!(scfsi & 0x8))
+			{
+				for (i = 0; i < 6; i++)
+					*scf++ = mpg123_getbits_fast(num0);
+				numbits += num0 * 6;
+			}
+			else
+			{
+				scf += 6;
+			}
+
+			if (!(scfsi & 0x4))
+			{
+				for (i = 0; i < 5; i++)
+					*scf++ = mpg123_getbits_fast(num0);
+				numbits += num0 * 5;
+			}
+			else
+			{
+				scf += 5;
+			}
+
+			if (!(scfsi & 0x2))
+			{
+				for (i = 0; i < 5; i++)
+					*scf++ = mpg123_getbits_fast(num1);
+				numbits += num1 * 5;
+			}
+			else
+			{
+				scf += 5;
+			}
+
+			if (!(scfsi & 0x1))
+			{
+				for (i = 0; i < 5; i++)
+					*scf++ = mpg123_getbits_fast(num1);
+				numbits += num1 * 5;
+			}
+			else
+			{
+				scf += 5;
+			}
+			*scf++ = 0;	/* no l[21] in original sources */
+		}
+	}
+	return numbits;
+}
+
+static int III_get_scale_factors_2(int *scf, struct gr_info_s *gr_info, int i_stereo)
+{
+	unsigned char *pnt;
+	int i, j, n = 0, numbits = 0;
+	unsigned int slen;
+
+	static unsigned char stab[3][6][4] =
+	{
+		{{6, 5, 5, 5}, {6, 5, 7, 3}, {11, 10, 0, 0},
+		 {7, 7, 7, 0}, {6, 6, 6, 3}, {8, 8, 5, 0}},
+		{{9, 9, 9, 9}, {9, 9, 12, 6}, {18, 18, 0, 0},
+		 {12, 12, 12, 0}, {12, 9, 9, 6}, {15, 12, 9, 0}},
+		{{6, 9, 9, 9}, {6, 9, 12, 6}, {15, 18, 0, 0},
+		 {6, 15, 12, 0}, {6, 12, 9, 6}, {6, 18, 9, 0}}
+	};
+
+	if (i_stereo)		/* i_stereo AND second channel -> mpg123_do_layer3() checks this */
+		slen = i_slen2[gr_info->scalefac_compress >> 1];
+	else
+		slen = n_slen2[gr_info->scalefac_compress];
+
+	gr_info->preflag = (slen >> 15) & 0x1;
+
+	n = 0;
+	if (gr_info->block_type == 2)
+	{
+		n++;
+		if (gr_info->mixed_block_flag)
+			n++;
+	}
+
+	pnt = stab[n][(slen >> 12) & 0x7];
+
+	for (i = 0; i < 4; i++)
+	{
+		int num = slen & 0x7;
+
+		slen >>= 3;
+		if (num)
+		{
+			for (j = 0; j < (int) (pnt[i]); j++)
+				*scf++ = mpg123_getbits_fast(num);
+			numbits += pnt[i] * num;
+		}
+		else
+		{
+			for (j = 0; j < (int) (pnt[i]); j++)
+				*scf++ = 0;
+		}
+	}
+
+	n = (n << 1) + 1;
+	for (i = 0; i < n; i++)
+		*scf++ = 0;
+
+	return numbits;
+}
+
+static int pretab1[22] =
+{0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 2, 2, 3, 3, 3, 2, 0};
+static int pretab2[22] =
+{0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0};
+
+/*
+ * Dequantize samples (includes huffman decoding)
+ */
+/* 24 is enough because tab13 has max. a 19 bit huffvector */
+#define BITSHIFT (int)((sizeof (long) - 1) * 8)
+
+#define REFRESH_MASK()							\
+while(num < BITSHIFT) {							\
+	mask |= ((unsigned long)mpg123_getbyte()) << (BITSHIFT - num);	\
+	num += 8;							\
+	part2remain -= 8;						\
+}
+
+static int III_dequantize_sample(real xr[SBLIMIT][SSLIMIT], int *scf,
+			struct gr_info_s *gr_info, int sfreq, int part2bits)
+{
+	int shift = 1 + gr_info->scalefac_scale;
+	real *xrpnt = (real *) xr;
+	int l[3], l3;
+	int part2remain = gr_info->part2_3_length - part2bits;
+	int *me;
+
+	int num = mpg123_getbitoffset();
+	long mask;
+	/* we must split this, because for num==0 the shift is undefined if you do it in one step */
+	mask = ((unsigned long) mpg123_getbits(num)) << BITSHIFT;
+	mask <<= 8 - num;
+	part2remain -= num;
+
+	{
+		int bv = gr_info->big_values;
+		int region1 = gr_info->region1start;
+		int region2 = gr_info->region2start;
+
+		l3 = ((576 >> 1) - bv) >> 1;
+/*
+ * we may lose the 'odd' bit here !! 
+ * check this later again 
+ */
+		if (bv <= region1)
+		{
+			l[0] = bv;
+			l[1] = 0;
+			l[2] = 0;
+		}
+		else
+		{
+			l[0] = region1;
+			if (bv <= region2)
+			{
+				l[1] = bv - l[0];
+				l[2] = 0;
+			}
+			else
+			{
+				l[1] = region2 - l[0];
+				l[2] = bv - region2;
+			}
+		}
+	}
+
+	if (gr_info->block_type == 2)
+	{
+		/*
+		 * decoding with short or mixed mode BandIndex table 
+		 */
+		int i, max[4];
+		int step = 0, lwin = 3, cb = 0;
+		register real v = 0.0;
+		register int *m, mc;
+
+		if (gr_info->mixed_block_flag)
+		{
+			max[3] = -1;
+			max[0] = max[1] = max[2] = 2;
+			m = map[sfreq][0];
+			me = mapend[sfreq][0];
+		}
+		else
+		{
+			max[0] = max[1] = max[2] = max[3] = -1;
+			/* max[3] not really needed in this case */
+			m = map[sfreq][1];
+			me = mapend[sfreq][1];
+		}
+
+		mc = 0;
+		for (i = 0; i < 2; i++)
+		{
+			int lp = l[i];
+			struct newhuff *h = ht + gr_info->table_select[i];
+
+			for (; lp; lp--, mc--)
+			{
+				register int x, y;
+				if ((!mc))
+				{
+					mc = *m++;
+					xrpnt = ((real *) xr) + (*m++);
+					lwin = *m++;
+					cb = *m++;
+					if (lwin == 3)
+					{
+						v = gr_info->pow2gain[(*scf++) << shift];
+						step = 1;
+					}
+					else
+					{
+						v = gr_info->full_gain[lwin][(*scf++) << shift];
+						step = 3;
+					}
+				}
+				{
+					register short *val = h->table;
+
+					REFRESH_MASK();
+					while ((y = *val++) < 0)
+					{
+						if (mask < 0)
+							val -= y;
+						num--;
+						mask <<= 1;
+					}
+					x = y >> 4;
+					y &= 0xf;
+				}
+				if (x == 15 && h->linbits)
+				{
+					max[lwin] = cb;
+					REFRESH_MASK();
+					x += ((unsigned long) mask) >> (BITSHIFT + 8 - h->linbits);
+					num -= h->linbits + 1;
+					mask <<= h->linbits;
+					if (mask < 0)
+						*xrpnt = -ispow[x] * v;
+					else
+						*xrpnt = ispow[x] * v;
+					mask <<= 1;
+				}
+				else if (x)
+				{
+					max[lwin] = cb;
+					if (mask < 0)
+						*xrpnt = -ispow[x] * v;
+					else
+						*xrpnt = ispow[x] * v;
+					num--;
+					mask <<= 1;
+				}
+				else
+					*xrpnt = 0.0;
+				xrpnt += step;
+				if (y == 15 && h->linbits)
+				{
+					max[lwin] = cb;
+					REFRESH_MASK();
+					y += ((unsigned long) mask) >> (BITSHIFT + 8 - h->linbits);
+					num -= h->linbits + 1;
+					mask <<= h->linbits;
+					if (mask < 0)
+						*xrpnt = -ispow[y] * v;
+					else
+						*xrpnt = ispow[y] * v;
+					mask <<= 1;
+				}
+				else if (y)
+				{
+					max[lwin] = cb;
+					if (mask < 0)
+						*xrpnt = -ispow[y] * v;
+					else
+						*xrpnt = ispow[y] * v;
+					num--;
+					mask <<= 1;
+				}
+				else
+					*xrpnt = 0.0;
+				xrpnt += step;
+			}
+		}
+
+		for (; l3 && (part2remain + num > 0); l3--)
+		{
+			struct newhuff *h = htc + gr_info->count1table_select;
+			register short *val = h->table, a;
+
+			REFRESH_MASK();
+			while ((a = *val++) < 0)
+			{
+				if (mask < 0)
+					val -= a;
+				num--;
+				mask <<= 1;
+			}
+			if (part2remain + num <= 0)
+			{
+				num -= part2remain + num;
+				break;
+			}
+
+			for (i = 0; i < 4; i++)
+			{
+				if (!(i & 1))
+				{
+					if (!mc)
+					{
+						mc = *m++;
+						xrpnt =	((real *) xr) + (*m++);
+						lwin = *m++;
+						cb = *m++;
+						if (lwin == 3)
+						{
+							v = gr_info->pow2gain[(*scf++) << shift];
+							step = 1;
+						}
+						else
+						{
+							v = gr_info->full_gain[lwin][(*scf++) << shift];
+							step = 3;
+						}
+					}
+					mc--;
+				}
+				if ((a & (0x8 >> i)))
+				{
+					max[lwin] = cb;
+					if (part2remain + num <= 0)
+					{
+						break;
+					}
+					if (mask < 0)
+						*xrpnt = -v;
+					else
+						*xrpnt = v;
+					num--;
+					mask <<= 1;
+				}
+				else
+					*xrpnt = 0.0;
+				xrpnt += step;
+			}
+		}
+
+		if (lwin < 3)
+		{		/* short band? */
+			while (1)
+			{
+				/* HACK Prevent overflowing the xr buffer */
+				if (mc * 6 > &xr[SBLIMIT][SSLIMIT] - xrpnt)
+					return 1;
+					
+				for (; mc > 0; mc--)
+				{
+					*xrpnt = 0.0;
+					xrpnt += 3;	/* short band -> step=3 */
+					*xrpnt = 0.0;
+					xrpnt += 3;
+				}
+				if (m >= me)
+					break;
+				mc = *m++;
+				xrpnt = ((real *) xr) + *m++;
+				if (*m++ == 0)
+					break;	/* optimize: field will be set to zero at the end of the function */
+				m++;	/* cb */
+			}
+		}
+
+		gr_info->maxband[0] = max[0] + 1;
+		gr_info->maxband[1] = max[1] + 1;
+		gr_info->maxband[2] = max[2] + 1;
+		gr_info->maxbandl = max[3] + 1;
+
+		{
+			int rmax = max[0] > max[1] ? max[0] : max[1];
+
+			rmax = (rmax > max[2] ? rmax : max[2]) + 1;
+			gr_info->maxb = rmax ? shortLimit[sfreq][rmax] : longLimit[sfreq][max[3] + 1];
+		}
+
+	}
+	else
+	{
+		/*
+		 * decoding with 'long' BandIndex table (block_type != 2)
+		 */
+		int *pretab = gr_info->preflag ? pretab1 : pretab2;
+		int i, max = -1;
+		int cb = 0;
+		int *m = map[sfreq][2];
+		register real v = 0.0;
+		int mc = 0;
+
+		/*
+		 * long hash table values
+		 */
+		for (i = 0; i < 3; i++)
+		{
+			int lp = l[i];
+			struct newhuff *h = ht + gr_info->table_select[i];
+
+			for (; lp; lp--, mc--)
+			{
+				int x, y;
+
+				if (!mc)
+				{
+					mc = *m++;
+					cb = *m++;
+/*  					if (cb == 21) */
+/*  						v = 0.0; */
+/*  					else */
+						v = gr_info->pow2gain[((*scf++) + (*pretab++)) << shift];
+
+				}
+				{
+					register short *val = h->table;
+					REFRESH_MASK();
+					while ((y = *val++) < 0)
+					{
+						if (mask < 0)
+							val -= y;
+						num--;
+						mask <<= 1;
+					}
+					x = y >> 4;
+					y &= 0xf;
+				}
+
+				if (x == 15 && h->linbits)
+				{
+					max = cb;
+					REFRESH_MASK();
+					x += ((unsigned long) mask) >> (BITSHIFT + 8 - h->linbits);
+					num -= h->linbits + 1;
+					mask <<= h->linbits;
+					if (mask < 0)
+						*xrpnt++ = -ispow[x] * v;
+					else
+						*xrpnt++ = ispow[x] * v;
+					mask <<= 1;
+				}
+				else if (x)
+				{
+					max = cb;
+					if (mask < 0)
+						*xrpnt++ = -ispow[x] * v;
+					else
+						*xrpnt++ = ispow[x] * v;
+					num--;
+					mask <<= 1;
+				}
+				else
+					*xrpnt++ = 0.0;
+
+				if (y == 15 && h->linbits)
+				{
+					max = cb;
+					REFRESH_MASK();
+					y += ((unsigned long) mask) >> (BITSHIFT + 8 - h->linbits);
+					num -= h->linbits + 1;
+					mask <<= h->linbits;
+					if (mask < 0)
+						*xrpnt++ = -ispow[y] * v;
+					else
+						*xrpnt++ = ispow[y] * v;
+					mask <<= 1;
+				}
+				else if (y)
+				{
+					max = cb;
+					if (mask < 0)
+						*xrpnt++ = -ispow[y] * v;
+					else
+						*xrpnt++ = ispow[y] * v;
+					num--;
+					mask <<= 1;
+				}
+				else
+					*xrpnt++ = 0.0;
+			}
+		}
+
+		/*
+		 * short (count1table) values
+		 */
+		for (; l3 && (part2remain + num > 0); l3--)
+		{
+			struct newhuff *h = htc + gr_info->count1table_select;
+			register short *val = h->table, a;
+
+			REFRESH_MASK();
+			while ((a = *val++) < 0)
+			{
+				if (mask < 0)
+					val -= a;
+				num--;
+				mask <<= 1;
+			}
+			if (part2remain + num <= 0)
+			{
+				num -= part2remain + num;
+				break;
+			}
+
+			for (i = 0; i < 4; i++)
+			{
+				if (!(i & 1))
+				{
+					if (!mc)
+					{
+						mc = *m++;
+						cb = *m++;
+/*  						if (cb == 21) */
+/*  							v = 0.0; */
+/*  						else */
+							v = gr_info->pow2gain[((*scf++) + (*pretab++)) << shift];
+					}
+					mc--;
+				}
+				if ((a & (0x8 >> i)))
+				{
+					max = cb;
+					if (part2remain + num <= 0)
+					{
+						break;
+					}
+					if (mask < 0)
+						*xrpnt++ = -v;
+					else
+						*xrpnt++ = v;
+					num--;
+					mask <<= 1;
+				}
+				else
+					*xrpnt++ = 0.0;
+			}
+		}
+
+		gr_info->maxbandl = max + 1;
+		gr_info->maxb = longLimit[sfreq][gr_info->maxbandl];
+	}
+
+	part2remain += num;
+	mpg123_backbits(num);
+	num = 0;
+
+	while (xrpnt < &xr[SBLIMIT][0])
+		*xrpnt++ = 0.0;
+
+	while (part2remain > 16)
+	{
+		mpg123_getbits(16);	/* Dismiss stuffing Bits */
+		part2remain -= 16;
+	}
+	if (part2remain > 0)
+		mpg123_getbits(part2remain);
+	else if (part2remain < 0)
+	{
+/*  		fprintf(stderr, "mpg123: Can't rewind stream by %d bits!\n", */
+/*  			-part2remain); */
+		return 1;	/* -> error */
+	}
+	return 0;
+}
+
+/* 
+ * III_stereo: calculate real channel values for Joint-I-Stereo-mode
+ */
+static void III_i_stereo(real xr_buf[2][SBLIMIT][SSLIMIT], int *scalefac, struct gr_info_s *gr_info, int sfreq, int ms_stereo, int lsf)
+{
+	real(*xr)[SBLIMIT * SSLIMIT] = (real(*)[SBLIMIT * SSLIMIT]) xr_buf;
+	struct bandInfoStruct *bi = &bandInfo[sfreq];
+
+	const real *tab1, *tab2;
+
+#if 1
+	int tab;
+	static const real *tabs[3][2][2] = {
+		{{tan1_1, tan2_1}, {tan1_2, tan2_2}},
+		{{pow1_1[0], pow2_1[0]}, {pow1_2[0], pow2_2[0]}},
+		{{pow1_1[1], pow2_1[1]}, {pow1_2[1], pow2_2[1]}}
+	};
+
+	tab = lsf + (gr_info->scalefac_compress & lsf);
+	tab1 = tabs[tab][ms_stereo][0];
+	tab2 = tabs[tab][ms_stereo][1];
+#else
+	if (lsf)
+	{
+		int p = gr_info->scalefac_compress & 0x1;
+
+		if (ms_stereo)
+		{
+			tab1 = pow1_2[p];
+			tab2 = pow2_2[p];
+		}
+		else
+		{
+			tab1 = pow1_1[p];
+			tab2 = pow2_1[p];
+		}
+	}
+	else
+	{
+		if (ms_stereo)
+		{
+			tab1 = tan1_2;
+			tab2 = tan2_2;
+		}
+		else
+		{
+			tab1 = tan1_1;
+			tab2 = tan2_1;
+		}
+	}
+#endif
+
+	if (gr_info->block_type == 2)
+	{
+		int lwin, do_l = 0;
+
+		if (gr_info->mixed_block_flag)
+			do_l = 1;
+
+		for (lwin = 0; lwin < 3; lwin++)
+		{	/* process each window */
+			/* get first band with zero values */
+			int is_p, sb, idx, sfb = gr_info->maxband[lwin];	/* sfb is minimal 3 for mixed mode */
+
+			if (sfb > 3)
+				do_l = 0;
+
+			for (; sfb < 12; sfb++)
+			{
+				is_p = scalefac[sfb * 3 + lwin - gr_info->mixed_block_flag];	/* scale: 0-15 */
+				if (is_p != 7)
+				{
+					real t1, t2;
+
+					sb = bi->shortDiff[sfb];
+					idx = bi->shortIdx[sfb] + lwin;
+					t1 = tab1[is_p];
+					t2 = tab2[is_p];
+					for (; sb > 0; sb--, idx += 3)
+					{
+						real v = xr[0][idx];
+
+						xr[0][idx] = v * t1;
+						xr[1][idx] = v * t2;
+					}
+				}
+			}
+
+#if 1
+/* in the original: copy 10 to 11 , here: copy 11 to 12 
+   maybe still wrong??? (copy 12 to 13?) */
+			is_p = scalefac[11 * 3 + lwin - gr_info->mixed_block_flag];	/* scale: 0-15 */
+			sb = bi->shortDiff[12];
+			idx = bi->shortIdx[12] + lwin;
+#else
+			is_p = scalefac[10 * 3 + lwin - gr_info->mixed_block_flag];	/* scale: 0-15 */
+			sb = bi->shortDiff[11];
+			idx = bi->shortIdx[11] + lwin;
+#endif
+			if (is_p != 7)
+			{
+				real t1, t2;
+				t1 = tab1[is_p];
+				t2 = tab2[is_p];
+				for (; sb > 0; sb--, idx += 3)
+				{
+					real v = xr[0][idx];
+					xr[0][idx] = v * t1;
+					xr[1][idx] = v * t2;
+				}
+			}
+		}		/* end for(lwin; .. ; . ) */
+
+/* also check l-part, if ALL bands in the three windows are 'empty'
+ * and mode = mixed_mode 
+ */
+		if (do_l)
+		{
+			int sfb = gr_info->maxbandl;
+			int idx = bi->longIdx[sfb];
+
+			for (; sfb < 8; sfb++)
+			{
+				int sb = bi->longDiff[sfb];
+				int is_p = scalefac[sfb];	/* scale: 0-15 */
+
+				if (is_p != 7)
+				{
+					real t1, t2;
+
+					t1 = tab1[is_p];
+					t2 = tab2[is_p];
+					for (; sb > 0; sb--, idx++)
+					{
+						real v = xr[0][idx];
+
+						xr[0][idx] = v * t1;
+						xr[1][idx] = v * t2;
+					}
+				}
+				else
+					idx += sb;
+			}
+		}
+	}
+	else
+	{			/* ((gr_info->block_type != 2)) */
+		int sfb = gr_info->maxbandl;
+		int is_p, idx = bi->longIdx[sfb];
+
+/* hmm ... maybe the maxbandl stuff for i-stereo is buggy? */
+		if (sfb <= 21)
+ 		{
+			for (; sfb < 21; sfb++)
+			{
+				int sb = bi->longDiff[sfb];
+
+				is_p = scalefac[sfb];	/* scale: 0-15 */
+				if (is_p != 7)
+				{
+					real t1, t2;
+					t1 = tab1[is_p];
+					t2 = tab2[is_p];
+					for (; sb > 0; sb--, idx++)
+					{
+						real v = xr[0][idx];
+						xr[0][idx] = v * t1;
+						xr[1][idx] = v * t2;
+					}
+				}
+				else
+					idx += sb;
+			}
+
+			is_p = scalefac[20];
+			if (is_p != 7)
+			{		/* copy l-band 20 to l-band 21 */
+				int sb;
+				real t1 = tab1[is_p], t2 = tab2[is_p];
+
+				for (sb = bi->longDiff[21]; sb > 0; sb--, idx++)
+				{
+					real v = xr[0][idx];
+
+					xr[0][idx] = v * t1;
+					xr[1][idx] = v * t2;
+				}
+			}
+		}
+	}		/* ... */
+}
+
+static void III_antialias(real xr[SBLIMIT][SSLIMIT], struct gr_info_s *gr_info)
+{
+	int sblim;
+
+	if (gr_info->block_type == 2)
+	{
+		if (!gr_info->mixed_block_flag)
+			return;
+		sblim = 1;
+	}
+	else
+	{
+		sblim = gr_info->maxb - 1;
+	}
+
+	/* 31 alias-reduction operations between each pair of sub-bands */
+	/* with 8 butterflies between each pair                         */
+
+	{
+		int sb;
+		real *xr1 = (real *) xr[1];
+
+		if (sblim < 1 || sblim > SBLIMIT)
+			return;
+		
+		for (sb = sblim; sb; sb--, xr1 += 10)
+		{
+			int ss;
+			real *cs = aa_cs, *ca = aa_ca;
+			real *xr2 = xr1;
+
+			for (ss = 7; ss >= 0; ss--)
+			{	/* upper and lower butterfly inputs */
+				register real bu = *--xr2, bd = *xr1;
+
+				*xr2 = (bu * (*cs)) - (bd * (*ca));
+				*xr1++ = (bd * (*cs++)) + (bu * (*ca++));
+			}
+		}
+	}
+}
+
+/* 
+ This is an optimized DCT from Jeff Tsay's maplay 1.2+ package.
+ Saved one multiplication by doing the 'twiddle factor' stuff
+ together with the window mul. (MH)
+
+ This uses Byeong Gi Lee's Fast Cosine Transform algorithm, but the
+ 9 point IDCT needs to be reduced further. Unfortunately, I don't
+ know how to do that, because 9 is not an even number. - Jeff.
+
+ ****************************************************************
+
+ 9 Point Inverse Discrete Cosine Transform
+
+ This piece of code is Copyright 1997 Mikko Tommila and is freely usable
+ by anybody. The algorithm itself is of course in the public domain.
+
+ Again derived heuristically from the 9-point WFTA.
+
+ The algorithm is optimized (?) for speed, not for small rounding errors or
+ good readability.
+
+ 36 additions, 11 multiplications
+
+ Again this is very likely sub-optimal.
+
+ The code is optimized to use a minimum number of temporary variables,
+ so it should compile quite well even on 8-register Intel x86 processors.
+ This makes the code quite obfuscated and very difficult to understand.
+
+ References:
+ [1] S. Winograd: "On Computing the Discrete Fourier Transform",
+     Mathematics of Computation, Volume 32, Number 141, January 1978,
+     Pages 175-199
+*/
+
+/*------------------------------------------------------------------*/
+/*                                                                  */
+/*    Function: Calculation of the inverse MDCT                     */
+/*                                                                  */
+/*------------------------------------------------------------------*/
+
+#ifdef USE_3DNOW
+void dct36(real *inbuf,real *o1,real *o2,real *wintab,real *tsbuf)
+#else
+static void dct36(real * inbuf, real * o1, real * o2, real * wintab, real * tsbuf)
+#endif
+{
+#ifdef NEW_DCT9
+	real tmp[18];
+#endif
+
+	{
+		register real *in = inbuf;
+
+		in[17] += in[16];
+		in[16] += in[15];
+		in[15] += in[14];
+		in[14] += in[13];
+		in[13] += in[12];
+		in[12] += in[11];
+		in[11] += in[10];
+		in[10] += in[9];
+		in[9] += in[8];
+		in[8] += in[7];
+		in[7] += in[6];
+		in[6] += in[5];
+		in[5] += in[4];
+		in[4] += in[3];
+		in[3] += in[2];
+		in[2] += in[1];
+		in[1] += in[0];
+
+		in[17] += in[15];
+		in[15] += in[13];
+		in[13] += in[11];
+		in[11] += in[9];
+		in[9] += in[7];
+		in[7] += in[5];
+		in[5] += in[3];
+		in[3] += in[1];
+
+
+#ifdef NEW_DCT9
+#if 1
+		{
+			real t3;
+			{
+				real t0, t1, t2;
+
+				t0 = COS6_2 * (in[8] + in[16] - in[4]);
+				t1 = COS6_2 * in[12];
+
+				t3 = in[0];
+				t2 = t3 - t1 - t1;
+				tmp[1] = tmp[7] = t2 - t0;
+				tmp[4] = t2 + t0 + t0;
+				t3 += t1;
+
+				t2 = COS6_1 * (in[10] + in[14] - in[2]);
+				tmp[1] -= t2;
+				tmp[7] += t2;
+			}
+			{
+				real t0, t1, t2;
+
+				t0 = cos9[0] * (in[4] + in[8]);
+				t1 = cos9[1] * (in[8] - in[16]);
+				t2 = cos9[2] * (in[4] + in[16]);
+
+				tmp[2] = tmp[6] = t3 - t0 - t2;
+				tmp[0] = tmp[8] = t3 + t0 + t1;
+				tmp[3] = tmp[5] = t3 - t1 + t2;
+			}
+		}
+		{
+			real t1, t2, t3;
+
+			t1 = cos18[0] * (in[2] + in[10]);
+			t2 = cos18[1] * (in[10] - in[14]);
+			t3 = COS6_1 * in[6];
+
+			{
+				real t0 = t1 + t2 + t3;
+				tmp[0] += t0;
+				tmp[8] -= t0;
+			}
+
+			t2 -= t3;
+			t1 -= t3;
+
+			t3 = cos18[2] * (in[2] + in[14]);
+
+			t1 += t3;
+			tmp[3] += t1;
+			tmp[5] -= t1;
+
+			t2 -= t3;
+			tmp[2] += t2;
+			tmp[6] -= t2;
+		}
+
+#else
+		{
+			real t0, t1, t2, t3, t4, t5, t6, t7;
+
+			t1 = COS6_2 * in[12];
+			t2 = COS6_2 * (in[8] + in[16] - in[4]);
+
+			t3 = in[0] + t1;
+			t4 = in[0] - t1 - t1;
+			t5 = t4 - t2;
+			tmp[4] = t4 + t2 + t2;
+
+			t0 = cos9[0] * (in[4] + in[8]);
+			t1 = cos9[1] * (in[8] - in[16]);
+
+			t2 = cos9[2] * (in[4] + in[16]);
+
+			t6 = t3 - t0 - t2;
+			t0 += t3 + t1;
+			t3 += t2 - t1;
+
+			t2 = cos18[0] * (in[2] + in[10]);
+			t4 = cos18[1] * (in[10] - in[14]);
+			t7 = COS6_1 * in[6];
+
+			t1 = t2 + t4 + t7;
+			tmp[0] = t0 + t1;
+			tmp[8] = t0 - t1;
+			t1 = cos18[2] * (in[2] + in[14]);
+			t2 += t1 - t7;
+
+			tmp[3] = t3 + t2;
+			t0 = COS6_1 * (in[10] + in[14] - in[2]);
+			tmp[5] = t3 - t2;
+
+			t4 -= t1 + t7;
+
+			tmp[1] = t5 - t0;
+			tmp[7] = t5 + t0;
+			tmp[2] = t6 + t4;
+			tmp[6] = t6 - t4;
+		}
+#endif
+
+		{
+			real t0, t1, t2, t3, t4, t5, t6, t7;
+
+			t1 = COS6_2 * in[13];
+			t2 = COS6_2 * (in[9] + in[17] - in[5]);
+
+			t3 = in[1] + t1;
+			t4 = in[1] - t1 - t1;
+			t5 = t4 - t2;
+
+			t0 = cos9[0] * (in[5] + in[9]);
+			t1 = cos9[1] * (in[9] - in[17]);
+
+			tmp[13] = (t4 + t2 + t2) * tfcos36[17 - 13];
+			t2 = cos9[2] * (in[5] + in[17]);
+
+			t6 = t3 - t0 - t2;
+			t0 += t3 + t1;
+			t3 += t2 - t1;
+
+			t2 = cos18[0] * (in[3] + in[11]);
+			t4 = cos18[1] * (in[11] - in[15]);
+			t7 = COS6_1 * in[7];
+
+			t1 = t2 + t4 + t7;
+			tmp[17] = (t0 + t1) * tfcos36[17 - 17];
+			tmp[9] = (t0 - t1) * tfcos36[17 - 9];
+			t1 = cos18[2] * (in[3] + in[15]);
+			t2 += t1 - t7;
+
+			tmp[14] = (t3 + t2) * tfcos36[17 - 14];
+			t0 = COS6_1 * (in[11] + in[15] - in[3]);
+			tmp[12] = (t3 - t2) * tfcos36[17 - 12];
+
+			t4 -= t1 + t7;
+
+			tmp[16] = (t5 - t0) * tfcos36[17 - 16];
+			tmp[10] = (t5 + t0) * tfcos36[17 - 10];
+			tmp[15] = (t6 + t4) * tfcos36[17 - 15];
+			tmp[11] = (t6 - t4) * tfcos36[17 - 11];
+		}
+
+#define MACRO(v)						\
+do {								\
+	real tmpval;						\
+								\
+	tmpval = tmp[(v)] + tmp[17-(v)];			\
+	out2[9+(v)] = tmpval * w[27+(v)];			\
+	out2[8-(v)] = tmpval * w[26-(v)];			\
+	tmpval = tmp[(v)] - tmp[17-(v)];			\
+	ts[SBLIMIT*(8-(v))] = out1[8-(v)] + tmpval * w[8-(v)];	\
+	ts[SBLIMIT*(9+(v))] = out1[9+(v)] + tmpval * w[9+(v)];	\
+} while (0)
+
+		{
+			register real *out2 = o2;
+			register real *w = wintab;
+			register real *out1 = o1;
+			register real *ts = tsbuf;
+
+			MACRO(0);
+			MACRO(1);
+			MACRO(2);
+			MACRO(3);
+			MACRO(4);
+			MACRO(5);
+			MACRO(6);
+			MACRO(7);
+			MACRO(8);
+		}
+
+#else
+
+		{
+
+#define MACRO0(v)						\
+do {								\
+	real tmp;						\
+	out2[9+(v)] = (tmp = sum0 + sum1) * w[27+(v)];		\
+	out2[8-(v)] = tmp * w[26-(v)];				\
+	sum0 -= sum1;						\
+	ts[SBLIMIT*(8-(v))] = out1[8-(v)] + sum0 * w[8-(v)];	\
+	ts[SBLIMIT*(9+(v))] = out1[9+(v)] + sum0 * w[9+(v)];	\
+} while (0)
+
+#define MACRO1(v)				\
+do {						\
+	real sum0,sum1;				\
+	sum0 = tmp1a + tmp2a;			\
+	sum1 = (tmp1b + tmp2b) * tfcos36[(v)];	\
+	MACRO0(v);				\
+} while (0)
+
+#define MACRO2(v)				\
+do {						\
+	real sum0, sum1;			\
+	sum0 = tmp2a - tmp1a;			\
+	sum1 = (tmp2b - tmp1b) * tfcos36[(v)];	\
+	MACRO0(v);				\
+} while (0)
+
+			register const real *c = COS9;
+			register real *out2 = o2;
+			register real *w = wintab;
+			register real *out1 = o1;
+			register real *ts = tsbuf;
+
+			real ta33, ta66, tb33, tb66;
+
+			ta33 = in[2 * 3 + 0] * c[3];
+			ta66 = in[2 * 6 + 0] * c[6] + in[2 * 0 + 0];
+			tb33 = in[2 * 3 + 1] * c[3];
+			tb66 = in[2 * 6 + 1] * c[6] + in[2 * 0 + 1];
+
+			{
+				real tmp1a, tmp2a, tmp1b, tmp2b;
+				tmp1a =	in[2 * 1 + 0] * c[1] + ta33 + in[2 * 5 + 0] * c[5] + in[2 * 7 + 0] * c[7];
+				tmp1b =	in[2 * 1 + 1] * c[1] + tb33 + in[2 * 5 + 1] * c[5] + in[2 * 7 + 1] * c[7];
+				tmp2a =	in[2 * 2 + 0] * c[2] + in[2 * 4 + 0] * c[4] + ta66 + in[2 * 8 + 0] * c[8];
+				tmp2b =	in[2 * 2 + 1] * c[2] + in[2 * 4 + 1] * c[4] + tb66 + in[2 * 8 + 1] * c[8];
+
+				MACRO1(0);
+				MACRO2(8);
+			}
+
+			{
+				real tmp1a, tmp2a, tmp1b, tmp2b;
+				tmp1a =	(in[2 * 1 + 0] - in[2 * 5 + 0] - in[2 * 7 + 0]) * c[3];
+				tmp1b =	(in[2 * 1 + 1] - in[2 * 5 + 1] - in[2 * 7 + 1]) * c[3];
+				tmp2a =	(in[2 * 2 + 0] - in[2 * 4 + 0] - in[2 * 8 + 0]) * c[6] - in[2 * 6 + 0] + in[2 * 0 + 0];
+				tmp2b =	(in[2 * 2 + 1] - in[2 * 4 + 1] - in[2 * 8 + 1]) * c[6] - in[2 * 6 + 1] + in[2 * 0 + 1];
+
+				MACRO1(1);
+				MACRO2(7);
+			}
+
+			{
+				real tmp1a, tmp2a, tmp1b, tmp2b;
+				tmp1a =	in[2 * 1 + 0] * c[5] - ta33 - in[2 * 5 + 0] * c[7] + in[2 * 7 + 0] * c[1];
+				tmp1b =	in[2 * 1 + 1] * c[5] - tb33 - in[2 * 5 + 1] * c[7] + in[2 * 7 + 1] * c[1];
+				tmp2a =	-in[2 * 2 + 0] * c[8] - in[2 * 4 + 0] * c[2] + ta66 + in[2 * 8 + 0] * c[4];
+				tmp2b =	-in[2 * 2 + 1] * c[8] - in[2 * 4 + 1] * c[2] + tb66 + in[2 * 8 + 1] * c[4];
+
+				MACRO1(2);
+				MACRO2(6);
+			}
+
+			{
+				real tmp1a, tmp2a, tmp1b, tmp2b;
+				tmp1a =	in[2 * 1 + 0] * c[7] - ta33 + in[2 * 5 + 0] * c[1] - in[2 * 7 + 0] * c[5];
+				tmp1b =	in[2 * 1 + 1] * c[7] - tb33 + in[2 * 5 + 1] * c[1] - in[2 * 7 + 1] * c[5];
+				tmp2a =	-in[2 * 2 + 0] * c[4] + in[2 * 4 + 0] * c[8] + ta66 - in[2 * 8 + 0] * c[2];
+				tmp2b =	-in[2 * 2 + 1] * c[4] + in[2 * 4 + 1] * c[8] + tb66 - in[2 * 8 + 1] * c[2];
+
+				MACRO1(3);
+				MACRO2(5);
+			}
+
+			{
+				real sum0, sum1;
+
+				sum0 = in[2 * 0 + 0] - in[2 * 2 + 0] + in[2 * 4 + 0] - in[2 * 6 + 0] + in[2 * 8 + 0];
+				sum1 = (in[2 * 0 + 1] - in[2 * 2 + 1] + in[2 * 4 + 1] - in[2 * 6 + 1] + in[2 * 8 + 1]) * tfcos36[4];
+				MACRO0(4);
+			}
+		}
+#endif
+
+	}
+}
+
+/*
+ * new DCT12
+ */
+static void dct12(real * in, real * rawout1, real * rawout2, register real * wi, register real * ts)
+{
+
+#define DCT12_PART1()				\
+do {						\
+	in5 = in[5*3];				\
+	in5 += (in4 = in[4*3]);			\
+	in4 += (in3 = in[3*3]);			\
+	in3 += (in2 = in[2*3]);			\
+	in2 += (in1 = in[1*3]);			\
+	in1 += (in0 = in[0*3]);			\
+						\
+	in5 += in3; in3 += in1;			\
+						\
+	in2 *= COS6_1;				\
+	in3 *= COS6_1;				\
+} while (0) 
+
+#define DCT12_PART2()				\
+do {						\
+	in0 += in4 * COS6_2;			\
+						\
+	in4 = in0 + in2;			\
+	in0 -= in2;				\
+						\
+	in1 += in5 * COS6_2;			\
+						\
+	in5 = (in1 + in3) * tfcos12[0];		\
+	in1 = (in1 - in3) * tfcos12[2];		\
+						\
+	in3 = in4 + in5;			\
+	in4 -= in5;				\
+						\
+	in2 = in0 + in1;			\
+	in0 -= in1;				\
+} while (0)
+
+
+	{
+		real in0, in1, in2, in3, in4, in5;
+		register real *out1 = rawout1;
+
+		ts[SBLIMIT * 0] = out1[0];
+		ts[SBLIMIT * 1] = out1[1];
+		ts[SBLIMIT * 2] = out1[2];
+		ts[SBLIMIT * 3] = out1[3];
+		ts[SBLIMIT * 4] = out1[4];
+		ts[SBLIMIT * 5] = out1[5];
+
+		DCT12_PART1();
+
+		{
+			real tmp0, tmp1 = (in0 - in4);
+
+			{
+				real tmp2 = (in1 - in5) * tfcos12[1];
+
+				tmp0 = tmp1 + tmp2;
+				tmp1 -= tmp2;
+			}
+			ts[(17 - 1) * SBLIMIT] = out1[17 - 1] + tmp0 * wi[11 - 1];
+			ts[(12 + 1) * SBLIMIT] = out1[12 + 1] + tmp0 * wi[6 + 1];
+			ts[(6 + 1) * SBLIMIT] = out1[6 + 1] + tmp1 * wi[1];
+			ts[(11 - 1) * SBLIMIT] = out1[11 - 1] + tmp1 * wi[5 - 1];
+		}
+
+		DCT12_PART2();
+
+		ts[(17 - 0) * SBLIMIT] = out1[17 - 0] + in2 * wi[11 - 0];
+		ts[(12 + 0) * SBLIMIT] = out1[12 + 0] + in2 * wi[6 + 0];
+		ts[(12 + 2) * SBLIMIT] = out1[12 + 2] + in3 * wi[6 + 2];
+		ts[(17 - 2) * SBLIMIT] = out1[17 - 2] + in3 * wi[11 - 2];
+
+		ts[(6 + 0) * SBLIMIT] = out1[6 + 0] + in0 * wi[0];
+		ts[(11 - 0) * SBLIMIT] = out1[11 - 0] + in0 * wi[5 - 0];
+		ts[(6 + 2) * SBLIMIT] = out1[6 + 2] + in4 * wi[2];
+		ts[(11 - 2) * SBLIMIT] = out1[11 - 2] + in4 * wi[5 - 2];
+	}
+
+	in++;
+
+	{
+		real in0, in1, in2, in3, in4, in5;
+		register real *out2 = rawout2;
+
+		DCT12_PART1();
+
+		{
+			real tmp0, tmp1 = (in0 - in4);
+
+			{
+				real tmp2 = (in1 - in5) * tfcos12[1];
+
+				tmp0 = tmp1 + tmp2;
+				tmp1 -= tmp2;
+			}
+			out2[5 - 1] = tmp0 * wi[11 - 1];
+			out2[0 + 1] = tmp0 * wi[6 + 1];
+			ts[(12 + 1) * SBLIMIT] += tmp1 * wi[1];
+			ts[(17 - 1) * SBLIMIT] += tmp1 * wi[5 - 1];
+		}
+
+		DCT12_PART2();
+
+		out2[5 - 0] = in2 * wi[11 - 0];
+		out2[0 + 0] = in2 * wi[6 + 0];
+		out2[0 + 2] = in3 * wi[6 + 2];
+		out2[5 - 2] = in3 * wi[11 - 2];
+
+		ts[(12 + 0) * SBLIMIT] += in0 * wi[0];
+		ts[(17 - 0) * SBLIMIT] += in0 * wi[5 - 0];
+		ts[(12 + 2) * SBLIMIT] += in4 * wi[2];
+		ts[(17 - 2) * SBLIMIT] += in4 * wi[5 - 2];
+	}
+
+	in++;
+
+	{
+		real in0, in1, in2, in3, in4, in5;
+		register real *out2 = rawout2;
+
+		out2[12] = out2[13] = out2[14] = out2[15] = out2[16] = out2[17] = 0.0;
+
+		DCT12_PART1();
+
+		{
+			real tmp0, tmp1 = (in0 - in4);
+
+			{
+				real tmp2 = (in1 - in5) * tfcos12[1];
+
+				tmp0 = tmp1 + tmp2;
+				tmp1 -= tmp2;
+			}
+			out2[11 - 1] = tmp0 * wi[11 - 1];
+			out2[6 + 1] = tmp0 * wi[6 + 1];
+			out2[0 + 1] += tmp1 * wi[1];
+			out2[5 - 1] += tmp1 * wi[5 - 1];
+		}
+
+		DCT12_PART2();
+
+		out2[11 - 0] = in2 * wi[11 - 0];
+		out2[6 + 0] = in2 * wi[6 + 0];
+		out2[6 + 2] = in3 * wi[6 + 2];
+		out2[11 - 2] = in3 * wi[11 - 2];
+
+		out2[0 + 0] += in0 * wi[0];
+		out2[5 - 0] += in0 * wi[5 - 0];
+		out2[0 + 2] += in4 * wi[2];
+		out2[5 - 2] += in4 * wi[5 - 2];
+	}
+}
+
+/*
+ * III_hybrid
+ */
+static void III_hybrid(real fsIn[SBLIMIT][SSLIMIT],
+		       real tsOut[SSLIMIT][SBLIMIT], int ch,
+		       struct gr_info_s *gr_info, struct frame *fr)
+{
+	static real block[2][2][SBLIMIT * SSLIMIT] = { {{0,}} };
+	static int blc[2] = { 0, 0 };
+
+	real *tspnt = (real *) tsOut;
+	real *rawout1, *rawout2;
+	int bt;
+	unsigned sb = 0;
+
+	{
+		int b = blc[ch];
+		rawout1 = block[b][ch];
+		b = -b + 1;
+		rawout2 = block[b][ch];
+		blc[ch] = b;
+	}
+
+	if (gr_info->mixed_block_flag)
+	{
+		sb = 2;
+#ifdef USE_3DNOW
+	     (fr->dct36)(fsIn[0],rawout1,rawout2,win[0],tspnt);
+	     (fr->dct36)(fsIn[1],rawout1+18,rawout2+18,win1[0],tspnt+1);
+#else
+		dct36(fsIn[0], rawout1, rawout2, win[0], tspnt);
+		dct36(fsIn[1], rawout1 + 18, rawout2 + 18, win1[0], tspnt + 1);
+#endif
+		rawout1 += 36;
+		rawout2 += 36;
+		tspnt += 2;
+	}
+
+	bt = gr_info->block_type;
+	if (bt == 2)
+	{
+		for (; sb < gr_info->maxb; sb += 2, tspnt += 2, rawout1 += 36, rawout2 += 36)
+		{
+			dct12(fsIn[sb], rawout1, rawout2, win[2], tspnt);
+			dct12(fsIn[sb + 1], rawout1 + 18, rawout2 + 18, win1[2], tspnt + 1);
+		}
+	}
+	else
+	{
+		for (; sb < gr_info->maxb; sb += 2, tspnt += 2, rawout1 += 36, rawout2 += 36)
+		{
+#ifdef USE_3DNOW
+			(fr->dct36)(fsIn[sb],rawout1,rawout2,win[bt],tspnt);
+			(fr->dct36)(fsIn[sb+1],rawout1+18,rawout2+18,win1[bt],tspnt+1);
+#else
+			dct36(fsIn[sb], rawout1, rawout2, win[bt], tspnt);
+			dct36(fsIn[sb + 1], rawout1 + 18, rawout2 + 18, win1[bt], tspnt + 1);
+#endif
+		}
+	}
+
+	for (; sb < SBLIMIT; sb++, tspnt++)
+	{
+		int i;
+		for (i = 0; i < SSLIMIT; i++)
+		{
+			tspnt[i * SBLIMIT] = *rawout1++;
+			*rawout2++ = 0.0;
+		}
+	}
+}
+
+/*
+ * main layer3 handler
+ */
+int mpg123_do_layer3(struct frame *fr)
+{
+	int gr, ch, ss;
+	int scalefacs[2][39];	/* max 39 for short[13][3] mode, mixed: 38, long: 22 */
+	struct III_sideinfo sideinfo;
+	int stereo = fr->stereo;
+	int single = fr->single;
+	int ms_stereo, i_stereo;
+	int sfreq = fr->sampling_frequency;
+	int stereo1, granules;
+
+	if (stereo == 1)
+	{			/* stream is mono */
+		stereo1 = 1;
+		single = 0;
+	}
+	else if (single >= 0)	/* stream is stereo, but force to mono */
+		stereo1 = 1;
+	else
+		stereo1 = 2;
+
+	if (fr->mode == MPG_MD_JOINT_STEREO)
+	{
+		ms_stereo = (fr->mode_ext & 0x2) >> 1;
+		i_stereo = fr->mode_ext & 0x1;
+	}
+	else
+		ms_stereo = i_stereo = 0;
+
+	granules = fr->lsf ? 1 : 2;
+	if (!III_get_side_info(&sideinfo, stereo, ms_stereo, sfreq, single, fr->lsf))
+		return 0;
+
+	mpg123_set_pointer(sideinfo.main_data_begin);
+
+	for (gr = 0; gr < granules; gr++)
+	{
+		real hybridIn[2][SBLIMIT][SSLIMIT];
+		real hybridOut[2][SSLIMIT][SBLIMIT];
+
+		{
+			struct gr_info_s *gr_info = &(sideinfo.ch[0].gr[gr]);
+			long part2bits;
+
+			if (fr->lsf)
+				part2bits = III_get_scale_factors_2(scalefacs[0], gr_info, 0);
+			else
+				part2bits = III_get_scale_factors_1(scalefacs[0], gr_info);
+
+			if (III_dequantize_sample(hybridIn[0], scalefacs[0], gr_info, sfreq, part2bits))
+				return 0;
+		}
+
+		if (stereo == 2)
+		{
+			struct gr_info_s *gr_info = &(sideinfo.ch[1].gr[gr]);
+			long part2bits;
+
+			if (fr->lsf)
+				part2bits = III_get_scale_factors_2(scalefacs[1], gr_info, i_stereo);
+			else
+				part2bits = III_get_scale_factors_1(scalefacs[1], gr_info);
+
+			if (III_dequantize_sample(hybridIn[1], scalefacs[1], gr_info, sfreq, part2bits))
+				return 0;
+
+			if (ms_stereo)
+			{
+				int i;
+				unsigned maxb = sideinfo.ch[0].gr[gr].maxb;
+
+				if (sideinfo.ch[1].gr[gr].maxb > maxb)
+					maxb = sideinfo.ch[1].gr[gr].maxb;
+				for (i = 0; i < SSLIMIT * maxb; i++)
+				{
+					real tmp0 = ((real *) hybridIn[0])[i];
+					real tmp1 = ((real *) hybridIn[1])[i];
+					((real *) hybridIn[0])[i] = tmp0 + tmp1;
+					((real *) hybridIn[1])[i] = tmp0 - tmp1;
+				}
+			}
+
+			if (i_stereo)
+				III_i_stereo(hybridIn, scalefacs[1], gr_info, sfreq, ms_stereo, fr->lsf);
+
+			if (ms_stereo || i_stereo || (single == 3))
+			{
+				if (gr_info->maxb > sideinfo.ch[0].gr[gr].maxb)
+					sideinfo.ch[0].gr[gr].maxb = gr_info->maxb;
+				else
+					gr_info->maxb = sideinfo.ch[0].gr[gr].maxb;
+			}
+
+			switch (single)
+			{
+				case 3:
+					{
+						register unsigned i;
+						register real *in0 = (real *) hybridIn[0],
+							*in1 = (real *) hybridIn[1];
+						for (i = 0; i < SSLIMIT * gr_info->maxb; 	     i++, in0++)
+							*in0 = (*in0 + *in1++);	/* *0.5 done by pow-scale */
+					}
+					break;
+				case 1:
+					{
+						register unsigned i;
+						register real *in0 = (real *) hybridIn[0],
+							*in1 = (real *) hybridIn[1];
+						for (i = 0; i < SSLIMIT * gr_info->maxb; i++)
+							*in0++ = *in1++;
+					}
+					break;
+			}
+		}
+/***
+		if (mpg123_info->eq_active)
+		{
+			int i, sb;
+
+			if (single < 0)
+			{
+				for (sb = 0, i = 0; sb < SBLIMIT; sb++)
+				{
+					for (ss = 0; ss < SSLIMIT; ss++)
+					{
+						hybridIn[0][sb][ss] *= mpg123_info->eq_mul[i];
+						hybridIn[1][sb][ss] *= mpg123_info->eq_mul[i++];
+					}
+				}
+			}
+			else
+			{
+				for (sb = 0, i = 0; sb < SBLIMIT; sb++)
+				{
+					for (ss = 0; ss < SSLIMIT; ss++)
+						hybridIn[0][sb][ss] *= mpg123_info->eq_mul[i++];
+				}
+			}
+		}
+***/
+
+		for (ch = 0; ch < stereo1; ch++)
+		{
+			struct gr_info_s *gr_info = &(sideinfo.ch[ch].gr[gr]);
+
+			III_antialias(hybridIn[ch], gr_info);
+			if (gr_info->maxb < 1 || gr_info->maxb > SBLIMIT)
+				return 0;
+			III_hybrid(hybridIn[ch], hybridOut[ch], ch, gr_info, fr);
+		}
+
+		for (ss = 0; ss < SSLIMIT; ss++)
+		{
+			if (single >= 0)
+			{
+				(fr->synth_mono) (hybridOut[0][ss], mpg123_pcm_sample, &mpg123_pcm_point);
+			}
+			else
+			{
+				int p1 = mpg123_pcm_point;
+
+				(fr->synth) (hybridOut[0][ss], 0, mpg123_pcm_sample, &p1);
+				(fr->synth) (hybridOut[1][ss], 1, mpg123_pcm_sample, &mpg123_pcm_point);
+			}
+		}
+
+/***
+		if (mpg123_info->output_audio)
+		{
+			mpg123_ip.add_vis_pcm(mpg123_ip.output->written_time(),
+					      mpg123_cfg.resolution == 16 ? FMT_S16_NE : FMT_U8,
+					      mpg123_cfg.channels == 2 ? fr->stereo : 1,
+					      mpg123_pcm_point, mpg123_pcm_sample);
+			while (mpg123_ip.output->buffer_free() < mpg123_pcm_point &&
+			       mpg123_info->going && mpg123_info->jump_to_time == -1)
+				xmms_usleep(10000);
+			if (mpg123_info->going && mpg123_info->jump_to_time == -1)
+				mpg123_ip.output->write_audio(mpg123_pcm_sample, mpg123_pcm_point);
+		}
+***/
+		mpg123_pcm_point = 0;
+	}
+	return 1;
+}