summary refs log tree commit diff
path: root/src/Vorbis.c
diff options
context:
space:
mode:
authorWlodekM <[email protected]>2024-06-16 10:35:45 +0300
committerWlodekM <[email protected]>2024-06-16 10:35:45 +0300
commitabef6da56913f1c55528103e60a50451a39628b1 (patch)
treeb3c8092471ecbb73e568cd0d336efa0e7871ee8d /src/Vorbis.c
initial commit
Diffstat (limited to 'src/Vorbis.c')
-rw-r--r--src/Vorbis.c1674
1 files changed, 1674 insertions, 0 deletions
diff --git a/src/Vorbis.c b/src/Vorbis.c
new file mode 100644
index 0000000..7d00688
--- /dev/null
+++ b/src/Vorbis.c
@@ -0,0 +1,1674 @@
+#include "Vorbis.h"
+#include "Logger.h"
+#include "Platform.h"
+#include "Event.h"
+#include "ExtMath.h"
+#include "Funcs.h"
+#include "Errors.h"
+#include "Stream.h"
+
+/*########################################################################################################################*
+*-------------------------------------------------------Ogg stream--------------------------------------------------------*
+*#########################################################################################################################*/
+#define OGG_FourCC(a, b, c, d) (((cc_uint32)a << 24) | ((cc_uint32)b << 16) | ((cc_uint32)c << 8) | (cc_uint32)d)
+/* See https://xiph.org/ogg/ */
+
+static void Ogg_DiscardPacket(struct OggState* ctx) {
+	ctx->cur += ctx->left;
+	ctx->left = 0;
+}
+
+static void Ogg_NextPacket(struct OggState* ctx) {
+	cc_uint8 part;
+	ctx->left = 0;
+
+	for (; ctx->segmentsRead < ctx->numSegments; ) {
+		part = ctx->segments[ctx->segmentsRead++];
+		ctx->left += part;
+		if (part != 255) break; /* end of this packet */
+	}
+}
+
+static cc_result Ogg_NextPage(struct OggState* ctx) {
+	cc_uint8 header[27];
+	struct Stream* source;
+	cc_uint32 sig, size;
+	cc_result res;
+	int i;
+
+	/* OGG page format:
+	* header[0]  (4) page signature
+	* header[4]  (1) page version
+	* header[5]  (1) page flags
+	* header[6]  (8) granule position
+	* header[14] (4) serial number
+	* header[18] (4) page sequence number
+	* header[22] (4) page checksum
+	* header[26] (1) number of segments
+	* [number of segments] number of bytes in each segment
+	* [sum of bytes in each segment] page data
+	*/
+	/* An OGG page is then further split into one or more packets */
+	source = ctx->source;
+	if ((res = Stream_Read(source, header, sizeof(header)))) return res;
+
+	sig = Stream_GetU32_BE(&header[0]);
+	if (sig == OGG_FourCC('I','D','3', 2))  return AUDIO_ERR_MP3_SIG; /* ID3 v2.2 tags header */
+	if (sig == OGG_FourCC('I','D','3', 3))  return AUDIO_ERR_MP3_SIG; /* ID3 v2.3 tags header */
+	if (sig != OGG_FourCC('O','g','g','S')) return OGG_ERR_INVALID_SIG;
+	if (header[4] != 0) return OGG_ERR_VERSION;
+
+	ctx->segmentsRead = 0;
+	ctx->numSegments  = header[26];
+	if ((res = Stream_Read(source, ctx->segments, ctx->numSegments))) return res;
+
+	size = 0;
+	for (i = 0; i < ctx->numSegments; i++) size += ctx->segments[i];
+	if ((res = Stream_Read(source, ctx->buffer, size))) return res;
+
+	ctx->cur  = ctx->buffer;
+	ctx->last = header[5] & 4;
+	Ogg_NextPacket(ctx);
+	return 0;
+}
+
+static cc_result Ogg_Read(struct OggState* ctx, cc_uint8* data, cc_uint32 count) {
+	cc_uint32 left = count;
+	cc_result res;
+	while (left) {
+		if (ctx->left) {
+			count = min(left, ctx->left);
+			Mem_Copy(data, ctx->cur, count);
+
+			ctx->cur  += count;
+			ctx->left -= count;
+			left      -= count;
+		} else if (ctx->segmentsRead < ctx->numSegments) {
+			Ogg_NextPacket(ctx);
+		} else {
+			if (ctx->last) return ERR_END_OF_STREAM;
+			if ((res = Ogg_NextPage(ctx))) return res;
+		}
+	}
+	return 0;
+}
+
+static cc_result Ogg_Skip(struct OggState* ctx, cc_uint32 count) {
+	cc_uint8 tmp[3584]; /* not quite 4 KB to avoid chkstk call */
+	cc_uint32 left = count;
+	cc_result res;
+
+	/* TODO: Should Ogg_Read be duplicated here to avoid Mem_Copy call? */
+	/* Probably not worth it considering how small comments are */
+	while (left) {
+		count = min(left, sizeof(tmp));
+		if ((res = Ogg_Read(ctx, tmp, count))) return res;
+		left -= count;
+	}
+	return 0;
+}
+
+static cc_result Ogg_ReadU8(struct OggState* ctx, cc_uint8* data) {
+	/* The fast path below almost always gets used */
+	if (!ctx->left) return Ogg_Read(ctx, data, 1);
+
+	*data = *ctx->cur;
+	ctx->cur++;
+	ctx->left--;
+	return 0;
+}
+
+static cc_result Ogg_ReadU32(struct OggState* ctx, cc_uint32* value) {
+	cc_uint8 data[4]; cc_result res;
+	if ((res = Ogg_Read(ctx, data, 4))) return res;
+	*value = Stream_GetU32_LE(data); return 0;
+}
+
+void Ogg_Init(struct OggState* ctx, struct Stream* source) {
+	ctx->cur  = ctx->buffer;
+	ctx->left = 0;
+	ctx->last = 0;
+	ctx->source = source;
+	ctx->segmentsRead = 0;
+	ctx->numSegments  = 0;
+}
+
+
+/*########################################################################################################################*
+*------------------------------------------------------Vorbis utils-------------------------------------------------------*
+*#########################################################################################################################*/
+#define Vorbis_PushByte(ctx, value) ctx->Bits |= (cc_uint32)(value) << ctx->NumBits; ctx->NumBits += 8;
+#define Vorbis_PeekBits(ctx, bits) (ctx->Bits & ((1UL << (bits)) - 1UL))
+#define Vorbis_ConsumeBits(ctx, bits) ctx->Bits >>= (bits); ctx->NumBits -= (bits);
+/* Aligns bit buffer to be on a byte boundary */
+#define Vorbis_AlignBits(ctx) alignSkip = ctx->NumBits & 7; Vorbis_ConsumeBits(ctx, alignSkip);
+/* See https://xiph.org/vorbis/doc/Vorbis_I_spec.html */
+
+/* TODO: Make sure this is inlined */
+static cc_uint32 Vorbis_ReadBits(struct VorbisState* ctx, cc_uint32 bitsCount) {
+	cc_uint8 portion;
+	cc_uint32 data;
+	cc_result res;
+
+	while (ctx->NumBits < bitsCount) {
+		res = Ogg_ReadU8(ctx->source, &portion);
+		if (res) { Logger_Abort2(res, "Failed to read byte for vorbis"); }
+		Vorbis_PushByte(ctx, portion);
+	}
+
+	data = Vorbis_PeekBits(ctx, bitsCount); Vorbis_ConsumeBits(ctx, bitsCount);
+	return data;
+}
+
+static cc_result Vorbis_TryReadBits(struct VorbisState* ctx, cc_uint32 bitsCount, cc_uint32* data) {
+	cc_uint8 portion;
+	cc_result res;
+
+	while (ctx->NumBits < bitsCount) {
+		res = Ogg_ReadU8(ctx->source, &portion);
+		if (res) return res;
+		Vorbis_PushByte(ctx, portion);
+	}
+
+	*data = Vorbis_PeekBits(ctx, bitsCount); Vorbis_ConsumeBits(ctx, bitsCount);
+	return 0;
+}
+
+static cc_uint32 Vorbis_ReadBit(struct VorbisState* ctx) {
+	cc_uint8 portion;
+	cc_uint32 data;
+	cc_result res;
+
+	if (!ctx->NumBits) {
+		res = Ogg_ReadU8(ctx->source, &portion);
+		if (res) { Logger_Abort2(res, "Failed to read byte for vorbis"); }
+		Vorbis_PushByte(ctx, portion);
+	}
+
+	data = Vorbis_PeekBits(ctx, 1); Vorbis_ConsumeBits(ctx, 1);
+	return data;
+}
+
+
+/* Vorbis spec 9.2.1. ilog */
+static int iLog(int x) {
+	int bits = 0;
+	while (x > 0) { bits++; x >>= 1; }
+	return bits;
+}
+
+/* https://en.wikipedia.org/wiki/Single-precision_floating-point_format */
+/* Float consists of: */
+/* - 1 bit for sign */
+/* - 8 bits for biased exponent */
+/* - 23 bits for mantissa */
+#define FLT_SIGN_MASK      0x80000000
+#define FLT_EXPONENT_BIAS  127
+#define FLT_EXPONENT_SHIFT 23
+#define FLT_EXPONENT_MASK  0x7F800000
+#define FLT_MANTISSA_MASK  0x007FFFFF
+
+/* returns m * 2^exp */
+static float Fast_ldexpf(int m, int exp) {
+	union IntAndFloat raw;
+	int e;
+	raw.f = m;
+
+	e  = (raw.i & FLT_EXPONENT_MASK) >> FLT_EXPONENT_SHIFT;
+	e -= FLT_EXPONENT_BIAS;
+	e += exp;
+
+	/* Treat denormal exponents as just +-0 */
+	if (e < -126) return m < 0 ? -0.0f : 0.0f;
+	/* Treat large exponents as infinity */
+	if (e >  128) e = 128;
+	e += FLT_EXPONENT_BIAS;
+
+	raw.i = (e << FLT_EXPONENT_SHIFT) | (raw.i & (FLT_MANTISSA_MASK | FLT_SIGN_MASK));
+	return raw.f;
+}
+
+/* Vorbis spec 9.2.2. float32_unpack */
+static float float32_unpack(struct VorbisState* ctx) {
+	/* ReadBits can't reliably read over 24 bits */
+	cc_uint32 lo = Vorbis_ReadBits(ctx, 16);
+	cc_uint32 hi = Vorbis_ReadBits(ctx, 16);
+	cc_uint32 x = (hi << 16) | lo;
+
+	cc_int32 mantissa  =  x & 0x1fffff;
+	cc_uint32 exponent = (x & 0x7fe00000) >> 21;
+	if (x & 0x80000000UL) mantissa = -mantissa;
+
+	return Fast_ldexpf(mantissa, (int)exponent - 788);
+}
+
+
+/*########################################################################################################################*
+*----------------------------------------------------Vorbis codebooks-----------------------------------------------------*
+*#########################################################################################################################*/
+/* Vorbis spec 3. Probability Model and Codebooks */
+#define CODEBOOK_SYNC 0x564342
+
+struct Codebook {
+	cc_uint32 dimensions, entries, totalCodewords;
+	cc_uint32* codewords;
+	cc_uint32* values;
+	cc_uint32 numCodewords[33]; /* number of codewords of bit length i */
+	/* vector quantisation values */
+	float minValue, deltaValue;
+	cc_uint32 sequenceP, lookupType, lookupValues;
+	cc_uint16* multiplicands;
+};
+
+static void Codebook_Free(struct Codebook* c) {
+	Mem_Free(c->codewords);
+	Mem_Free(c->values);
+	Mem_Free(c->multiplicands);
+}
+
+static cc_uint32 Codebook_Pow(cc_uint32 base, cc_uint32 exp) {
+	cc_uint32 result = 1; /* exponentiation by squaring */
+	while (exp) {
+		if (exp & 1) result *= base;
+		exp >>= 1;
+		base *= base;
+	}
+	return result;
+}
+
+static cc_uint32 Codebook_Lookup1Values(cc_uint32 entries, cc_uint32 dimensions) {
+	cc_uint32 i, pow, next;
+	/* the greatest integer value for which [value] to the power of [dimensions] is less than or equal to [entries] */
+	/* TODO: verify this */
+	for (i = 1; ; i++) 
+	{
+		pow  = Codebook_Pow(i,     dimensions);
+		next = Codebook_Pow(i + 1, dimensions);
+
+		if (next < pow)     return i; /* overflow */
+		if (pow == entries) return i;
+		if (next > entries) return i;
+	}
+	return 0;
+}
+
+static cc_bool Codebook_CalcCodewords(struct Codebook* c, cc_uint8* len) {
+	/* This is taken from stb_vorbis.c because I gave up trying */
+	cc_uint32 i, depth;
+	cc_uint32 root, codeword;
+	cc_uint32 next_codewords[33] = { 0 };
+	int offset;
+	int len_offsets[33];
+
+	c->codewords = (cc_uint32*)Mem_Alloc(c->totalCodewords, 4, "codewords");
+	c->values    = (cc_uint32*)Mem_Alloc(c->totalCodewords, 4, "values");
+
+	/* Codeword entries are ordered by length */
+	offset = 0;
+	for (i = 0; i < Array_Elems(len_offsets); i++) 
+	{
+		len_offsets[i] = offset;
+		offset += c->numCodewords[i];
+	}
+
+	/* add codeword 0 to tree */
+	for (i = 0; i < c->entries; i++) 
+	{
+		if (!len[i]) continue;
+		offset = len_offsets[len[i]];
+
+		c->codewords[offset] = 0;
+		c->values[offset]    = i;
+
+		len_offsets[len[i]]++;
+		break;
+	}
+
+	/* set codewords that new nodes can start from */
+	for (depth = 1; depth <= len[i]; depth++) 
+	{
+		next_codewords[depth] = 1U << (32 - depth);
+	}
+
+	i++; /* first codeword was already handled */
+	for (; i < c->entries; i++) 
+	{
+		root = len[i];
+		if (!root) continue;
+		offset = len_offsets[len[i]];
+
+		/* per spec, find lowest possible value (leftmost) */
+		while (root && next_codewords[root] == 0) root--;
+		if (root == 0) return false;
+
+		codeword = next_codewords[root];
+		next_codewords[root] = 0;
+
+		c->codewords[offset] = codeword;
+		c->values[offset]    = i;
+
+		for (depth = len[i]; depth > root; depth--) 
+		{
+			next_codewords[depth] = codeword + (1U << (32 - depth));
+		}
+
+		len_offsets[len[i]]++;
+	}
+	return true;
+}
+
+static cc_result Codebook_DecodeSetup(struct VorbisState* ctx, struct Codebook* c) {
+	cc_uint32 sync;
+	cc_uint8* codewordLens;
+	int i, entry;
+	int sparse, len;
+	int runBits, runLen;
+	int valueBits;
+	cc_uint32 lookupValues;
+
+	sync = Vorbis_ReadBits(ctx, 24);
+	if (sync != CODEBOOK_SYNC) return VORBIS_ERR_CODEBOOK_SYNC;
+	c->dimensions = Vorbis_ReadBits(ctx, 16);
+	c->entries    = Vorbis_ReadBits(ctx, 24);
+
+	codewordLens = (cc_uint8*)Mem_Alloc(c->entries, 1, "raw codeword lens");
+	for (i = 0; i < Array_Elems(c->numCodewords); i++) 
+	{
+		c->numCodewords[i] = 0;
+	}
+
+	/* ordered entries flag */
+	if (!Vorbis_ReadBit(ctx)) {
+		sparse = Vorbis_ReadBit(ctx);
+		entry  = 0;
+		for (i = 0; i < c->entries; i++) 
+		{
+			/* sparse trees may not have all entries */
+			if (sparse && !Vorbis_ReadBit(ctx)){
+				codewordLens[i] = 0;
+				continue; /* unused entry */
+			}
+
+			len = Vorbis_ReadBits(ctx, 5) + 1;
+			codewordLens[i] = len;
+			c->numCodewords[len]++;
+			entry++;
+		}
+	} else {
+		len = Vorbis_ReadBits(ctx, 5) + 1;
+		for (entry = 0; entry < c->entries;) 
+		{
+			runBits = iLog(c->entries - entry);
+			runLen  = Vorbis_ReadBits(ctx, runBits);
+
+			/* handle corrupted ogg files */
+			if (entry + runLen > c->entries) return VORBIS_ERR_CODEBOOK_ENTRY;
+
+			for (i = 0; i < runLen; i++) { codewordLens[entry++] = len; }
+			c->numCodewords[len++] = runLen;
+		}
+	}
+
+	c->totalCodewords = entry;
+	Codebook_CalcCodewords(c, codewordLens);
+	Mem_Free(codewordLens);
+
+	c->lookupType    = Vorbis_ReadBits(ctx, 4);
+	c->multiplicands = NULL;
+	if (c->lookupType == 0) return 0;
+	if (c->lookupType > 2)  return VORBIS_ERR_CODEBOOK_LOOKUP;
+
+	c->minValue   = float32_unpack(ctx);
+	c->deltaValue = float32_unpack(ctx);
+	valueBits     = Vorbis_ReadBits(ctx, 4) + 1;
+	c->sequenceP  = Vorbis_ReadBit(ctx);
+
+	if (c->lookupType == 1) {
+		lookupValues = Codebook_Lookup1Values(c->entries, c->dimensions);
+	} else {
+		lookupValues = c->entries * c->dimensions;
+	}
+	c->lookupValues = lookupValues;
+
+	c->multiplicands = (cc_uint16*)Mem_Alloc(lookupValues, 2, "multiplicands");
+	for (i = 0; i < lookupValues; i++) 
+	{
+		c->multiplicands[i] = Vorbis_ReadBits(ctx, valueBits);
+	}
+	return 0;
+}
+
+static cc_uint32 Codebook_DecodeScalar(struct VorbisState* ctx, struct Codebook* c) {
+	cc_uint32 codeword = 0, shift = 31, depth, i;
+	cc_uint32* codewords = c->codewords;
+	cc_uint32* values    = c->values;
+
+	/* TODO: This is so massively slow */
+	for (depth = 1; depth <= 32; depth++, shift--) 
+	{
+		codeword |= Vorbis_ReadBit(ctx) << shift;
+
+		for (i = 0; i < c->numCodewords[depth]; i++) 
+		{
+			if (codeword != codewords[i]) continue;
+			return values[i];
+		}
+
+		codewords += c->numCodewords[depth];
+		values    += c->numCodewords[depth];
+	}
+	Logger_Abort("Invalid huffman code");
+	return -1;
+}
+
+static void Codebook_DecodeVectors(struct VorbisState* ctx, struct Codebook* c, float* v, int step) {
+	cc_uint32 lookupOffset = Codebook_DecodeScalar(ctx, c);
+	float last = 0.0f, value;
+	cc_uint32 i, offset;
+
+	if (c->lookupType == 1) {		
+		cc_uint32 indexDivisor = 1;
+		for (i = 0; i < c->dimensions; i++, v += step) 
+		{
+			offset = (lookupOffset / indexDivisor) % c->lookupValues;
+			value  = c->multiplicands[offset] * c->deltaValue + c->minValue + last;
+
+			*v += value;
+			if (c->sequenceP) last = value;
+			indexDivisor *= c->lookupValues;
+		}
+	} else if (c->lookupType == 2) {
+		offset = lookupOffset * c->dimensions;
+		for (i = 0; i < c->dimensions; i++, offset++, v += step) 
+		{
+			value  = c->multiplicands[offset] * c->deltaValue + c->minValue + last;
+
+			*v += value;
+			if (c->sequenceP) last = value;
+		}
+	} else {
+		Logger_Abort("Invalid huffman code");
+	}
+}
+
+/*########################################################################################################################*
+*-----------------------------------------------------Vorbis floors-------------------------------------------------------*
+*#########################################################################################################################*/
+#define FLOOR_MAX_PARTITIONS 32
+#define FLOOR_MAX_CLASSES 16
+#define FLOOR_MAX_VALUES (FLOOR_MAX_PARTITIONS * 8 + 2)
+struct Floor {
+	cc_uint8 partitions, multiplier; int range, values;
+	cc_uint8 partitionClasses[FLOOR_MAX_PARTITIONS];
+	cc_uint8 classDimensions[FLOOR_MAX_CLASSES];
+	cc_uint8 classSubClasses[FLOOR_MAX_CLASSES];
+	cc_uint8 classMasterbooks[FLOOR_MAX_CLASSES];
+	cc_int16 subclassBooks[FLOOR_MAX_CLASSES][8];
+	cc_int16  xList[FLOOR_MAX_VALUES];
+	cc_uint16 listOrder[FLOOR_MAX_VALUES];
+	cc_int32  yList[VORBIS_MAX_CHANS][FLOOR_MAX_VALUES];
+};
+
+/* Vorbis spec 10.1. floor1_inverse_dB_table */
+static const float floor1_inverse_dB_table[256] = {
+	1.0649863e-07f, 1.1341951e-07f, 1.2079015e-07f, 1.2863978e-07f, 1.3699951e-07f, 1.4590251e-07f, 1.5538408e-07f, 1.6548181e-07f,
+	1.7623575e-07f, 1.8768855e-07f, 1.9988561e-07f, 2.1287530e-07f, 2.2670913e-07f, 2.4144197e-07f, 2.5713223e-07f, 2.7384213e-07f,
+	2.9163793e-07f, 3.1059021e-07f, 3.3077411e-07f, 3.5226968e-07f, 3.7516214e-07f, 3.9954229e-07f, 4.2550680e-07f, 4.5315863e-07f,
+	4.8260743e-07f, 5.1396998e-07f, 5.4737065e-07f, 5.8294187e-07f, 6.2082472e-07f, 6.6116941e-07f, 7.0413592e-07f, 7.4989464e-07f,
+	7.9862701e-07f, 8.5052630e-07f, 9.0579828e-07f, 9.6466216e-07f, 1.0273513e-06f, 1.0941144e-06f, 1.1652161e-06f, 1.2409384e-06f,
+	1.3215816e-06f, 1.4074654e-06f, 1.4989305e-06f, 1.5963394e-06f, 1.7000785e-06f, 1.8105592e-06f, 1.9282195e-06f, 2.0535261e-06f,
+	2.1869758e-06f, 2.3290978e-06f, 2.4804557e-06f, 2.6416497e-06f, 2.8133190e-06f, 2.9961443e-06f, 3.1908506e-06f, 3.3982101e-06f,
+	3.6190449e-06f, 3.8542308e-06f, 4.1047004e-06f, 4.3714470e-06f, 4.6555282e-06f, 4.9580707e-06f, 5.2802740e-06f, 5.6234160e-06f,
+	5.9888572e-06f, 6.3780469e-06f, 6.7925283e-06f, 7.2339451e-06f, 7.7040476e-06f, 8.2047000e-06f, 8.7378876e-06f, 9.3057248e-06f,
+	9.9104632e-06f, 1.0554501e-05f, 1.1240392e-05f, 1.1970856e-05f, 1.2748789e-05f, 1.3577278e-05f, 1.4459606e-05f, 1.5399272e-05f,
+	1.6400004e-05f, 1.7465768e-05f, 1.8600792e-05f, 1.9809576e-05f, 2.1096914e-05f, 2.2467911e-05f, 2.3928002e-05f, 2.5482978e-05f,
+	2.7139006e-05f, 2.8902651e-05f, 3.0780908e-05f, 3.2781225e-05f, 3.4911534e-05f, 3.7180282e-05f, 3.9596466e-05f, 4.2169667e-05f,
+	4.4910090e-05f, 4.7828601e-05f, 5.0936773e-05f, 5.4246931e-05f, 5.7772202e-05f, 6.1526565e-05f, 6.5524908e-05f, 6.9783085e-05f,
+	7.4317983e-05f, 7.9147585e-05f, 8.4291040e-05f, 8.9768747e-05f, 9.5602426e-05f, 0.00010181521f, 0.00010843174f, 0.00011547824f,
+	0.00012298267f, 0.00013097477f, 0.00013948625f, 0.00014855085f, 0.00015820453f, 0.00016848555f, 0.00017943469f, 0.00019109536f,
+	0.00020351382f, 0.00021673929f, 0.00023082423f, 0.00024582449f, 0.00026179955f, 0.00027881276f, 0.00029693158f, 0.00031622787f,
+	0.00033677814f, 0.00035866388f, 0.00038197188f, 0.00040679456f, 0.00043323036f, 0.00046138411f, 0.00049136745f, 0.00052329927f,
+	0.00055730621f, 0.00059352311f, 0.00063209358f, 0.00067317058f, 0.00071691700f, 0.00076350630f, 0.00081312324f, 0.00086596457f,
+	0.00092223983f, 0.00098217216f, 0.0010459992f,  0.0011139742f,  0.0011863665f,  0.0012634633f,  0.0013455702f,  0.0014330129f,
+	0.0015261382f,  0.0016253153f,  0.0017309374f,  0.0018434235f,  0.0019632195f,  0.0020908006f,  0.0022266726f,  0.0023713743f,
+	0.0025254795f,  0.0026895994f,  0.0028643847f,  0.0030505286f,  0.0032487691f,  0.0034598925f,  0.0036847358f,  0.0039241906f,
+	0.0041792066f,  0.0044507950f,  0.0047400328f,  0.0050480668f,  0.0053761186f,  0.0057254891f,  0.0060975636f,  0.0064938176f,
+	0.0069158225f,  0.0073652516f,  0.0078438871f,  0.0083536271f,  0.0088964928f,  0.009474637f,   0.010090352f,   0.010746080f,
+	0.011444421f,   0.012188144f,   0.012980198f,   0.013823725f,   0.014722068f,   0.015678791f,   0.016697687f,   0.017782797f,
+	0.018938423f,   0.020169149f,   0.021479854f,   0.022875735f,   0.024362330f,   0.025945531f,   0.027631618f,   0.029427276f,
+	0.031339626f,   0.033376252f,   0.035545228f,   0.037855157f,   0.040315199f,   0.042935108f,   0.045725273f,   0.048696758f,
+	0.051861348f,   0.055231591f,   0.058820850f,   0.062643361f,   0.066714279f,   0.071049749f,   0.075666962f,   0.080584227f,
+	0.085821044f,   0.091398179f,   0.097337747f,   0.10366330f,    0.11039993f,    0.11757434f,    0.12521498f,    0.13335215f,
+	0.14201813f,    0.15124727f,    0.16107617f,    0.17154380f,    0.18269168f,    0.19456402f,    0.20720788f,    0.22067342f,
+	0.23501402f,    0.25028656f,    0.26655159f,    0.28387361f,    0.30232132f,    0.32196786f,    0.34289114f,    0.36517414f,
+	0.38890521f,    0.41417847f,    0.44109412f,    0.46975890f,    0.50028648f,    0.53279791f,    0.56742212f,    0.60429640f,
+	0.64356699f,    0.68538959f,    0.72993007f,    0.77736504f,    0.82788260f,    0.88168307f,    0.9389798f,     1.00000000f,
+};
+
+/* TODO: Make this thread safe */
+static cc_int16* tmp_xlist;
+static cc_uint16* tmp_order;
+static void Floor_SortXList(int left, int right) {
+	cc_uint16* values = tmp_order; cc_uint16 value;
+	cc_int16* keys = tmp_xlist;    cc_int16 key;
+
+	while (left < right) {
+		int i = left, j = right;
+		cc_int16 pivot = keys[(i + j) >> 1];
+
+		/* partition the list */
+		while (i <= j) {
+			while (pivot > keys[i]) i++;
+			while (pivot < keys[j]) j--;
+			QuickSort_Swap_KV_Maybe();
+		}
+		/* recurse into the smaller subset */
+		QuickSort_Recurse(Floor_SortXList)
+	}
+}
+
+static cc_result Floor_DecodeSetup(struct VorbisState* ctx, struct Floor* f) {
+	static const short ranges[4] = { 256, 128, 84, 64 };
+	int i, j, idx, maxClass;
+	int rangeBits, classNum;
+	cc_int16 xlist_sorted[FLOOR_MAX_VALUES];
+
+	f->partitions = Vorbis_ReadBits(ctx, 5);
+	maxClass = -1;
+	for (i = 0; i < f->partitions; i++) 
+	{
+		f->partitionClasses[i] = Vorbis_ReadBits(ctx, 4);
+		maxClass = max(maxClass, f->partitionClasses[i]);
+	}
+
+	for (i = 0; i <= maxClass; i++) 
+	{
+		f->classDimensions[i] = Vorbis_ReadBits(ctx, 3) + 1;
+		f->classSubClasses[i] = Vorbis_ReadBits(ctx, 2);
+
+		if (f->classSubClasses[i]) {
+			f->classMasterbooks[i] = Vorbis_ReadBits(ctx, 8);
+		}
+		for (j = 0; j < (1 << f->classSubClasses[i]); j++) 
+		{
+			f->subclassBooks[i][j] = (cc_int16)Vorbis_ReadBits(ctx, 8) - 1;
+		}
+	}
+
+	f->multiplier = Vorbis_ReadBits(ctx, 2) + 1;
+	f->range      = ranges[f->multiplier - 1];
+	rangeBits     = Vorbis_ReadBits(ctx, 4);
+
+	f->xList[0] = 0;
+	f->xList[1] = 1 << rangeBits;
+	for (i = 0, idx = 2; i < f->partitions; i++) 
+	{
+		classNum = f->partitionClasses[i];
+
+		for (j = 0; j < f->classDimensions[classNum]; j++) 
+		{
+			f->xList[idx++] = Vorbis_ReadBits(ctx, rangeBits);
+		}
+	}
+	f->values = idx;
+
+	/* sort X list for curve computation later */
+	Mem_Copy(xlist_sorted, f->xList, idx * 2);
+	for (i = 0; i < idx; i++) { f->listOrder[i] = i; }
+
+	tmp_xlist = xlist_sorted; 
+	tmp_order = f->listOrder;
+	Floor_SortXList(0, idx - 1);
+	return 0;
+}
+
+static cc_bool Floor_DecodeFrame(struct VorbisState* ctx, struct Floor* f, int ch) {
+	cc_int32* yList;
+	int i, j, idx, rangeBits;
+	cc_uint8 klass, cdim, cbits;
+	int bookNum;
+	cc_uint32 csub, cval;
+
+	/* does this frame have any energy */
+	if (!Vorbis_ReadBit(ctx)) return false;
+	yList = f->yList[ch];
+
+	rangeBits = iLog(f->range - 1);
+	yList[0]  = Vorbis_ReadBits(ctx, rangeBits);
+	yList[1]  = Vorbis_ReadBits(ctx, rangeBits);
+
+	for (i = 0, idx = 2; i < f->partitions; i++) 
+	{
+		klass = f->partitionClasses[i];
+		cdim  = f->classDimensions[klass];
+		cbits = f->classSubClasses[klass];
+
+		csub = (1 << cbits) - 1;
+		cval = 0;
+		if (cbits) {
+			bookNum = f->classMasterbooks[klass];
+			cval = Codebook_DecodeScalar(ctx, &ctx->codebooks[bookNum]);
+		}
+
+		for (j = 0; j < cdim; j++) 
+		{
+			bookNum = f->subclassBooks[klass][cval & csub];
+			cval >>= cbits;
+
+			if (bookNum >= 0) {
+				yList[idx + j] = Codebook_DecodeScalar(ctx, &ctx->codebooks[bookNum]);
+			} else {
+				yList[idx + j] = 0;
+			}
+		}
+		idx += cdim;
+	}
+	return true;
+}
+
+/* Vorbis spec 9.2.6. render_point */
+static int Floor_RenderPoint(int x0, int y0, int x1, int y1, int X) {
+	int dy  = y1 - y0, adx = x1 - x0;
+	int ady = Math_AbsI(dy);
+	int err = ady * (X - x0);
+	int off = err / adx;
+
+	if (dy < 0) {
+		return y0 - off;
+	} else {
+		return y0 + off;
+	}
+}
+
+/* Vorbis spec 9.2.7. render_line */
+static void Floor_RenderLine(int x0, int y0, int x1, int y1, float* data) {
+	int dy   = y1 - y0, adx = x1 - x0;
+	int ady  = Math_AbsI(dy);
+	int base = dy / adx, sy;
+	int x    = x0, y = y0, err = 0;
+
+	if (dy < 0) {
+		sy = base - 1;
+	} else {
+		sy = base + 1;
+	}
+
+	ady = ady - Math_AbsI(base) * adx;
+	data[x] *= floor1_inverse_dB_table[y];
+
+	for (x = x0 + 1; x < x1; x++) {
+		err = err + ady;
+		if (err >= adx) {
+			err = err - adx;
+			y = y + sy;
+		} else {
+			y = y + base;
+		}
+		data[x] *= floor1_inverse_dB_table[y];
+	}
+}
+
+/* Vorbis spec 9.2.4. low_neighbor */
+static int low_neighbor(cc_int16* v, int x) {
+	int n = 0, i, max = Int32_MinValue;
+	for (i = 0; i < x; i++) 
+	{
+		if (v[i] < v[x] && v[i] > max) { n = i; max = v[i]; }
+	}
+	return n;
+}
+
+/* Vorbis spec 9.2.5. high_neighbor */
+static int high_neighbor(cc_int16* v, int x) {
+	int n = 0, i, min = Int32_MaxValue;
+	for (i = 0; i < x; i++) 
+	{
+		if (v[i] > v[x] && v[i] < min) { n = i; min = v[i]; }
+	}
+	return n;
+}
+
+static void Floor_Synthesis(struct VorbisState* ctx, struct Floor* f, int ch) {
+	/* amplitude arrays */
+	cc_int32 YFinal[FLOOR_MAX_VALUES];
+	cc_bool Step2[FLOOR_MAX_VALUES];
+	cc_int32* yList;
+	float* data;
+	/* amplitude variables */
+	int lo_offset, hi_offset, predicted;
+	int val, highroom, lowroom, room;
+	int i;
+	/* curve variables */
+	int lx, hx, ly, hy;
+	int rawI;
+	float value;
+
+	/* amplitude value synthesis */
+	yList = f->yList[ch];
+	data  = ctx->curOutput[ch];
+
+	Step2[0]  = true;
+	Step2[1]  = true;
+	YFinal[0] = yList[0];
+	YFinal[1] = yList[1];
+
+	for (i = 2; i < f->values; i++) 
+	{
+		lo_offset = low_neighbor(f->xList, i);
+		hi_offset = high_neighbor(f->xList, i);
+		predicted = Floor_RenderPoint(f->xList[lo_offset], YFinal[lo_offset],
+									  f->xList[hi_offset], YFinal[hi_offset], f->xList[i]);
+
+		val      = yList[i];
+		highroom = f->range - predicted;
+		lowroom  = predicted;
+
+		if (highroom < lowroom) {
+			room = highroom * 2;
+		} else {
+			room = lowroom * 2;
+		}
+
+		if (val) {
+			Step2[lo_offset] = true;
+			Step2[hi_offset] = true;
+			Step2[i] = true;
+
+			if (val >= room) {
+				if (highroom > lowroom) {
+					YFinal[i] = val - lowroom + predicted;
+				} else {
+					YFinal[i] = predicted - val + highroom - 1;
+				}
+			} else {
+				if (val & 1) {
+					YFinal[i] = predicted - (val + 1) / 2;
+				} else {
+					YFinal[i] = predicted + val / 2;
+				}
+			}
+		} else {
+			Step2[i]  = false;
+			YFinal[i] = predicted;
+		}
+	}
+
+	/* curve synthesis */ 
+	lx = 0; ly = YFinal[f->listOrder[0]] * f->multiplier; 
+	hx = 0; hy = ly;
+
+	for (rawI = 1; rawI < f->values; rawI++) 
+	{
+		i = f->listOrder[rawI];
+		if (!Step2[i]) continue;
+
+		hx = f->xList[i]; hy = YFinal[i] * f->multiplier;
+		if (lx < hx) {
+			Floor_RenderLine(lx, ly, min(hx, ctx->dataSize), hy, data);
+		}
+		lx = hx; ly = hy;
+	}
+
+	/* fill remainder of floor with a flat line */
+	/* TODO: Is this right? should hy be 0, if Step2 is false for all */
+	if (hx >= ctx->dataSize) return;
+	lx = hx; hx = ctx->dataSize;
+
+	value = floor1_inverse_dB_table[hy];
+	for (; lx < hx; lx++) { data[lx] *= value; }
+}
+
+
+/*########################################################################################################################*
+*----------------------------------------------------Vorbis residues------------------------------------------------------*
+*#########################################################################################################################*/
+#define RESIDUE_MAX_CLASSIFICATIONS 65
+struct Residue {
+	cc_uint8  type, classifications, classbook;
+	cc_uint32 begin, end, partitionSize;
+	cc_uint8  cascade[RESIDUE_MAX_CLASSIFICATIONS];
+	cc_int16  books[RESIDUE_MAX_CLASSIFICATIONS][8];
+};
+
+static cc_result Residue_DecodeSetup(struct VorbisState* ctx, struct Residue* r, int type) {
+	cc_int16 codebook;
+	int i, j;
+
+	r->type  = (cc_uint8)type;
+	r->begin = Vorbis_ReadBits(ctx, 24);
+	r->end   = Vorbis_ReadBits(ctx, 24);
+	r->partitionSize   = Vorbis_ReadBits(ctx, 24) + 1;
+	r->classifications = Vorbis_ReadBits(ctx, 6)  + 1;
+	r->classbook       = Vorbis_ReadBits(ctx, 8);
+
+	for (i = 0; i < r->classifications; i++) 
+	{
+		r->cascade[i] = Vorbis_ReadBits(ctx, 3);
+		if (!Vorbis_ReadBit(ctx)) continue;
+		r->cascade[i] |= Vorbis_ReadBits(ctx, 5) << 3;
+	}
+
+	for (i = 0; i < r->classifications; i++) 
+	{
+		for (j = 0; j < 8; j++) 
+		{
+			codebook = -1;
+
+			if (r->cascade[i] & (1 << j)) {
+				codebook = Vorbis_ReadBits(ctx, 8);
+			}
+			r->books[i][j] = codebook;
+		}
+	}
+	return 0;
+}
+
+static void Residue_DecodeCore(struct VorbisState* ctx, struct Residue* r, cc_uint32 size, int ch, cc_bool* doNotDecode, float** data) {
+	struct Codebook* classbook;
+	cc_uint32 residueBeg, residueEnd;
+	cc_uint32 classwordsPerCodeword;
+	cc_uint32 nToRead, partitionsToRead;
+	int pass, i, j, k;
+
+	/* classification variables */
+	cc_uint8* classifications[VORBIS_MAX_CHANS];
+	cc_uint8* classifications_raw;
+	cc_uint32 temp;
+
+	/* partition variables */
+	struct Codebook* c;
+	float* v;
+	cc_uint32 offset;
+	cc_uint8 klass;
+	cc_int16 book;
+
+	/* per spec, ensure decoded bounds are actually in size */
+	residueBeg = min(r->begin, size);
+	residueEnd = min(r->end,   size);
+	classbook = &ctx->codebooks[r->classbook];
+
+	classwordsPerCodeword = classbook->dimensions;
+	nToRead = residueEnd - residueBeg;
+	partitionsToRead = nToRead / r->partitionSize;
+
+	/* first half of temp array is used by residue type 2 for storing temp interleaved data */
+	classifications_raw = ((cc_uint8*)ctx->temp) + (ctx->dataSize * ctx->channels * 5);
+	for (i = 0; i < ch; i++) 
+	{
+		/* add a bit of space in case classwordsPerCodeword is > partitionsToRead*/
+		classifications[i] = classifications_raw + i * (partitionsToRead + 64);
+	}
+
+	if (nToRead == 0) return;
+	for (pass = 0; pass < 8; pass++) 
+	{
+		cc_uint32 partitionCount = 0;
+		while (partitionCount < partitionsToRead) {
+
+			/* read classifications in pass 0 */
+			if (pass == 0) {
+				for (j = 0; j < ch; j++) 
+				{
+					if (doNotDecode[j]) continue;
+
+					temp = Codebook_DecodeScalar(ctx, classbook);
+					for (i = classwordsPerCodeword - 1; i >= 0; i--) 
+					{
+						classifications[j][i + partitionCount] = temp % r->classifications;
+						temp /= r->classifications;
+					}
+				}
+			}
+
+			for (i = 0; i < classwordsPerCodeword && partitionCount < partitionsToRead; i++) 
+			{
+				for (j = 0; j < ch; j++) 
+				{
+					if (doNotDecode[j]) continue;
+
+					klass = classifications[j][partitionCount];
+					book  = r->books[klass][pass];
+					if (book < 0) continue;
+
+					offset = residueBeg + partitionCount * r->partitionSize;
+					v = data[j] + offset;
+					c = &ctx->codebooks[book];
+
+					if (r->type == 0) {
+						int step = r->partitionSize / c->dimensions;
+						for (k = 0; k < step; k++) 
+						{
+							Codebook_DecodeVectors(ctx, c, v, step); v++;
+						}
+					} else {
+						for (k = 0; k < r->partitionSize; k += c->dimensions) 
+						{
+							Codebook_DecodeVectors(ctx, c, v, 1); v += c->dimensions;
+						}
+					}
+				}
+				partitionCount++;
+			}
+		}
+	}
+}
+
+static void Residue_DecodeFrame(struct VorbisState* ctx, struct Residue* r, int ch, cc_bool* doNotDecode, float** data) {
+	cc_uint32 size = ctx->dataSize;
+	float* interleaved;
+	cc_bool decodeAny;
+	int i, j;
+
+	if (r->type == 2) {
+		decodeAny = false;
+
+		/* type 2 decodes all channel vectors, if at least 1 channel to decode */
+		for (i = 0; i < ch; i++) 
+		{
+			if (!doNotDecode[i]) decodeAny = true;
+		}
+		if (!decodeAny) return;
+		decodeAny = false; /* because DecodeCore expects this to be 'false' for 'do not decode' */
+
+		interleaved = ctx->temp;
+		/* TODO: avoid using ctx->temp and deinterleaving at all */
+		/* TODO: avoid setting memory to 0 here */
+		Mem_Set(interleaved, 0, ctx->dataSize * ctx->channels * sizeof(float));
+		Residue_DecodeCore(ctx, r, size * ch, 1, &decodeAny, &interleaved);
+
+		/* deinterleave type 2 output */	
+		for (i = 0; i < size; i++) 
+		{
+			for (j = 0; j < ch; j++) 
+			{
+				data[j][i] = interleaved[i * ch + j];
+			}
+		}
+	} else {
+		Residue_DecodeCore(ctx, r, size, ch, doNotDecode, data);
+	}
+}
+
+
+/*########################################################################################################################*
+*----------------------------------------------------Vorbis mappings------------------------------------------------------*
+*#########################################################################################################################*/
+#define MAPPING_MAX_COUPLINGS 256
+#define MAPPING_MAX_SUBMAPS 15
+struct Mapping {
+	cc_uint8 couplingSteps, submaps;
+	cc_uint8 mux[VORBIS_MAX_CHANS];
+	cc_uint8 floorIdx[MAPPING_MAX_SUBMAPS];
+	cc_uint8 residueIdx[MAPPING_MAX_SUBMAPS];
+	cc_uint8 magnitude[MAPPING_MAX_COUPLINGS];
+	cc_uint8 angle[MAPPING_MAX_COUPLINGS];
+};
+
+static cc_result Mapping_DecodeSetup(struct VorbisState* ctx, struct Mapping* m) {
+	int i, submaps, reserved;
+	int couplingSteps, couplingBits;
+
+	submaps = 1;
+	if (Vorbis_ReadBit(ctx)) {
+		submaps = Vorbis_ReadBits(ctx, 4) + 1;
+	}
+
+	couplingSteps = 0;
+	if (Vorbis_ReadBit(ctx)) {
+		couplingSteps = Vorbis_ReadBits(ctx, 8) + 1;
+		/* TODO: How big can couplingSteps ever really get in practice? */
+		couplingBits  = iLog(ctx->channels - 1);
+
+		for (i = 0; i < couplingSteps; i++) 
+		{
+			m->magnitude[i] = Vorbis_ReadBits(ctx, couplingBits);
+			m->angle[i]     = Vorbis_ReadBits(ctx, couplingBits);
+			if (m->magnitude[i] == m->angle[i]) return VORBIS_ERR_MAPPING_CHANS;
+		}
+	}
+
+	reserved = Vorbis_ReadBits(ctx, 2);
+	if (reserved != 0) return VORBIS_ERR_MAPPING_RESERVED;
+	m->submaps = submaps;
+	m->couplingSteps = couplingSteps;
+
+	if (submaps > 1) {
+		for (i = 0; i < ctx->channels; i++) 
+		{
+			m->mux[i] = Vorbis_ReadBits(ctx, 4);
+		}
+	} else {
+		for (i = 0; i < ctx->channels; i++) 
+		{
+			m->mux[i] = 0;
+		}
+	}
+
+	for (i = 0; i < submaps; i++) 
+	{
+		Vorbis_ReadBits(ctx, 8); /* time value */
+		m->floorIdx[i]   = Vorbis_ReadBits(ctx, 8);
+		m->residueIdx[i] = Vorbis_ReadBits(ctx, 8);
+	}
+	return 0;
+}
+
+
+/*########################################################################################################################*
+*------------------------------------------------------imdct impl---------------------------------------------------------*
+*#########################################################################################################################*/
+#define PI MATH_PI
+static cc_uint32 Vorbis_ReverseBits(cc_uint32 v) {
+	v = ((v >> 1) & 0x55555555) | ((v & 0x55555555) << 1);
+	v = ((v >> 2) & 0x33333333) | ((v & 0x33333333) << 2);
+	v = ((v >> 4) & 0x0F0F0F0F) | ((v & 0x0F0F0F0F) << 4);
+	v = ((v >> 8) & 0x00FF00FF) | ((v & 0x00FF00FF) << 8);
+	v = (v >> 16) | (v << 16);
+	return v;
+}
+
+void imdct_init(struct imdct_state* state, int n) {
+	int k, k2, n4 = n >> 2, n8 = n >> 3, log2_n;
+	float *A = state->a, *B = state->b, *C = state->c;
+	cc_uint32* reversed;
+
+	log2_n   = Math_ilog2(n);
+	reversed = state->reversed;
+	state->n = n; state->log2_n = log2_n;
+
+	/* setup twiddle factors */
+	for (k = 0, k2 = 0; k < n4; k++, k2 += 2) 
+	{
+		A[k2]   =  Math_CosF((4*k * PI) / n);
+		A[k2+1] = -Math_SinF((4*k * PI) / n);
+		B[k2]   =  Math_CosF(((k2+1) * PI) / (2*n));
+		B[k2+1] =  Math_SinF(((k2+1) * PI) / (2*n));
+	}
+	for (k = 0, k2 = 0; k < n8; k++, k2 += 2) 
+	{
+		C[k2]   =  Math_CosF(((k2+1) * (2*PI)) / n);
+		C[k2+1] = -Math_SinF(((k2+1) * (2*PI)) / n);
+	}
+
+	for (k = 0; k < n8; k++) 
+	{
+		reversed[k] = Vorbis_ReverseBits(k) >> (32-log2_n+3);
+	}
+}
+
+void imdct_calc(float* in, float* out, struct imdct_state* state) {
+	int k, k2, k4, n = state->n;
+	int n2 = n >> 1, n4 = n >> 2, n8 = n >> 3, n3_4 = n - n4;
+	int l, log2_n;
+	cc_uint32* reversed;
+	
+	/* Optimised algorithm from "The use of multirate filter banks for coding of high quality digital audio" */
+	/* Uses a few fixes for the paper noted at http://www.nothings.org/stb_vorbis/mdct_01.txt */
+	float *A = state->a, *B = state->b, *C = state->c;
+
+	float u[VORBIS_MAX_BLOCK_SIZE / 2];
+	float w[VORBIS_MAX_BLOCK_SIZE / 2];
+	float e_1, e_2, f_1, f_2;
+	float g_1, g_2, h_1, h_2;
+	float x_1, x_2, y_1, y_2;
+
+
+	/* spectral coefficients, step 1, step 2 */ /* TODO avoid k */
+	for (k = 0, k2 = 0, k4 = 0; k < n8; k++, k2 += 2, k4 += 4) 
+	{
+		e_1 = -in[k4+3];   e_2 = -in[k4+1];
+		g_1 = e_1 * A[n2-1-k2] + e_2 * A[n2-2-k2];
+		g_2 = e_1 * A[n2-2-k2] - e_2 * A[n2-1-k2];
+
+		f_1 = in[n2-4-k4]; f_2 = in[n2-2-k4];
+		h_2 = f_1 * A[n4-2-k2] - f_2 * A[n4-1-k2];
+		h_1 = f_1 * A[n4-1-k2] + f_2 * A[n4-2-k2];
+
+		w[n4+1+k2] = h_2 + g_2;
+		w[n4+0+k2] = h_1 + g_1;
+
+		w[k2+1] = (h_2 - g_2) * A[n2-4-k4] - (h_1 - g_1) * A[n2-3-k4];
+		w[k2+0] = (h_1 - g_1) * A[n2-4-k4] + (h_2 - g_2) * A[n2-3-k4];
+	}
+
+	/* step 3 */
+	log2_n = state->log2_n;
+	for (l = 0; l <= log2_n - 4; l++) 
+	{
+		int k0 = n >> (l+3), k1 = 1 << (l+3);
+		int r, r2, rMax = n >> (l+4), s2, s2Max = 1 << (l+2);
+
+		for (r = 0, r2 = 0; r < rMax; r++, r2 += 2) 
+		{
+			for (s2 = 0; s2 < s2Max; s2 += 2) 
+			{
+				e_1 = w[n2-1-k0*s2-r2];     
+				e_2 = w[n2-2-k0*s2-r2];
+				f_1 = w[n2-1-k0*(s2+1)-r2]; 
+				f_2 = w[n2-2-k0*(s2+1)-r2];
+
+				u[n2-1-k0*s2-r2]     = e_1 + f_1;
+				u[n2-2-k0*s2-r2]     = e_2 + f_2;
+				u[n2-1-k0*(s2+1)-r2] = (e_1 - f_1) * A[r*k1] - (e_2 - f_2) * A[r*k1+1];
+				u[n2-2-k0*(s2+1)-r2] = (e_2 - f_2) * A[r*k1] + (e_1 - f_1) * A[r*k1+1];
+			}
+		}
+
+		/* TODO: eliminate this, do w/u in-place */
+		/* TODO: dynamically allocate mem for imdct */
+		if (l+1 <= log2_n - 4) {
+			Mem_Copy(w, u, n2 * sizeof(float));
+		}
+	}
+
+	/* step 4, step 5, step 6, step 7, step 8, output */
+	reversed = state->reversed;
+	for (k = 0, k2 = 0; k < n8; k++, k2 += 2) 
+	{
+		cc_uint32 j = reversed[k], j4 = j << 2;
+		e_1 = u[n2-j4-1]; e_2 = u[n2-j4-2];
+		f_1 = u[j4+1];    f_2 = u[j4+0];
+
+		g_1 =  e_1 + f_1 + C[k2+1] * (e_1 - f_1) + C[k2] * (e_2 + f_2);
+		h_1 =  e_1 + f_1 - C[k2+1] * (e_1 - f_1) - C[k2] * (e_2 + f_2);
+		g_2 =  e_2 - f_2 + C[k2+1] * (e_2 + f_2) - C[k2] * (e_1 - f_1);
+		h_2 = -e_2 + f_2 + C[k2+1] * (e_2 + f_2) - C[k2] * (e_1 - f_1);
+
+		x_1 = -0.5f * (g_1 * B[k2]   + g_2 * B[k2+1]);
+		x_2 = -0.5f * (g_1 * B[k2+1] - g_2 * B[k2]);
+		out[n4-1-k]   = -x_2;
+		out[n4+k]     =  x_2;
+		out[n3_4-1-k] =  x_1;
+		out[n3_4+k]   =  x_1;
+
+		y_1 = -0.5f * (h_1 * B[n2-2-k2] + h_2 * B[n2-1-k2]);
+		y_2 = -0.5f * (h_1 * B[n2-1-k2] - h_2 * B[n2-2-k2]);
+		out[k]      = -y_2;
+		out[n2-1-k] =  y_2;
+		out[n2+k]   =  y_1;
+		out[n-1-k]  =  y_1;
+	}
+}
+
+
+/*########################################################################################################################*
+*-----------------------------------------------------Vorbis setup--------------------------------------------------------*
+*#########################################################################################################################*/
+struct Mode { cc_uint8 blockSizeFlag, mappingIdx; };
+static cc_result Mode_DecodeSetup(struct VorbisState* ctx, struct Mode* m) {
+	int windowType, transformType;
+	m->blockSizeFlag = Vorbis_ReadBit(ctx);
+
+	windowType    = Vorbis_ReadBits(ctx, 16);
+	if (windowType != 0)    return VORBIS_ERR_MODE_WINDOW;
+	transformType = Vorbis_ReadBits(ctx, 16);
+	if (transformType != 0) return VORBIS_ERR_MODE_TRANSFORM;
+
+	m->mappingIdx = Vorbis_ReadBits(ctx, 8);
+	return 0;
+}
+
+static void Vorbis_CalcWindow(struct VorbisWindow* window, int blockSize) {
+	int i, n = blockSize / 2;
+	float *cur_window, *prev_window;
+	double inner;
+
+	window->Cur = window->Prev + n;
+	cur_window  = window->Cur;
+	prev_window = window->Prev;
+
+	for (i = 0; i < n; i++) 
+	{
+		inner          = Math_SinF((i + 0.5f) / n * (PI/2));
+		cur_window[i]  = Math_SinF((PI/2) * inner * inner);
+	}
+	for (i = 0; i < n; i++) 
+	{
+		inner          = Math_SinF((i + 0.5f) / n * (PI/2) + (PI/2));
+		prev_window[i] = Math_SinF((PI/2) * inner * inner);
+	}
+}
+
+void Vorbis_Init(struct VorbisState* ctx) {
+	Mem_Set(ctx, 0, sizeof(*ctx) - sizeof(ctx->imdct));
+}
+
+void Vorbis_Free(struct VorbisState* ctx) {
+	int i;
+	for (i = 0; i < ctx->numCodebooks; i++) 
+	{
+		Codebook_Free(&ctx->codebooks[i]);
+	}
+
+	Mem_Free(ctx->codebooks);
+	Mem_Free(ctx->floors);
+	Mem_Free(ctx->residues);
+	Mem_Free(ctx->mappings);
+	Mem_Free(ctx->modes);
+	Mem_Free(ctx->windowRaw);
+	Mem_Free(ctx->temp);
+}
+
+static cc_bool Vorbis_ValidBlockSize(cc_uint32 size) {
+	return size >= 64 && size <= VORBIS_MAX_BLOCK_SIZE && Math_IsPowOf2(size);
+}
+
+/* Vorbis spec 4.2.1. Common header decode */
+static cc_result Vorbis_CheckHeader(struct VorbisState* ctx, cc_uint8 type) {
+	cc_uint8 header[7];
+	cc_bool OK;
+	cc_result res;
+
+	if ((res = Ogg_Read(ctx->source, header, sizeof(header)))) return res;
+	if (header[0] != type) return VORBIS_ERR_WRONG_HEADER;
+
+	OK = 
+		header[1] == 'v' && header[2] == 'o' && header[3] == 'r' &&
+		header[4] == 'b' && header[5] == 'i' && header[6] == 's';
+	return OK ? 0 : ERR_INVALID_ARGUMENT;
+}
+
+/* Vorbis spec 4.2.2. Identification header */
+static cc_result Vorbis_DecodeIdentifier(struct VorbisState* ctx) {
+	cc_uint8 header[23];
+	cc_uint32 version;
+	cc_result res;
+
+	if ((res = Ogg_Read(ctx->source, header, sizeof(header)))) return res;
+	version  = Stream_GetU32_LE(&header[0]);
+	if (version != 0) return VORBIS_ERR_VERSION;
+
+	ctx->channels   = header[4];
+	ctx->sampleRate = Stream_GetU32_LE(&header[5]);
+	/* (12) bitrate_maximum, nominal, minimum */
+	ctx->blockSizes[0] = 1 << (header[21] & 0xF);
+	ctx->blockSizes[1] = 1 << (header[21] >>  4);
+
+	if (!Vorbis_ValidBlockSize(ctx->blockSizes[0])) return VORBIS_ERR_BLOCKSIZE;
+	if (!Vorbis_ValidBlockSize(ctx->blockSizes[1])) return VORBIS_ERR_BLOCKSIZE;
+	if (ctx->blockSizes[0] > ctx->blockSizes[1])    return VORBIS_ERR_BLOCKSIZE;
+
+	if (ctx->channels == 0 || ctx->channels > VORBIS_MAX_CHANS) return VORBIS_ERR_CHANS;
+	/* check framing flag */
+	return (header[22] & 1) ? 0 : VORBIS_ERR_FRAMING;
+}
+
+/* Vorbis spec 4.2.3. Comment header */
+static cc_result Vorbis_DecodeComments(struct VorbisState* ctx) {
+	cc_uint32 i, len, comments;
+	cc_uint8 flag;
+	cc_result res;
+	struct OggState* source = ctx->source;
+
+	/* vendor name, followed by comments */
+	if ((res = Ogg_ReadU32(source, &len)))      return res;
+	if ((res = Ogg_Skip(source, len)))          return res;
+	if ((res = Ogg_ReadU32(source, &comments))) return res;
+
+	for (i = 0; i < comments; i++) 
+	{
+		/* comments such as artist, year, etc */
+		if ((res = Ogg_ReadU32(source, &len))) return res;
+		if ((res = Ogg_Skip(source, len)))     return res;
+	}
+
+	/* check framing flag */
+	if ((res = Ogg_ReadU8(source, &flag))) return res;
+	return (flag & 1) ? 0 : VORBIS_ERR_FRAMING;
+}
+
+/* Vorbis spec 4.2.4. Setup header */
+static cc_result Vorbis_DecodeSetup(struct VorbisState* ctx) {
+	cc_uint32 framing, alignSkip;
+	int i, count;
+	cc_result res;
+
+	count = Vorbis_ReadBits(ctx, 8) + 1;
+	ctx->codebooks = (struct Codebook*)Mem_TryAlloc(count, sizeof(struct Codebook));
+	if (!ctx->codebooks) return ERR_OUT_OF_MEMORY;
+
+	for (i = 0; i < count; i++) 
+	{
+		res = Codebook_DecodeSetup(ctx, &ctx->codebooks[i]);
+		if (res) return res;
+	}
+	ctx->numCodebooks = count;
+
+	count = Vorbis_ReadBits(ctx, 6) + 1;
+	for (i = 0; i < count; i++) 
+	{
+		int time = Vorbis_ReadBits(ctx, 16);
+		if (time != 0) return VORBIS_ERR_TIME_TYPE;
+	}
+
+	count = Vorbis_ReadBits(ctx, 6) + 1;
+	ctx->floors = (struct Floor*)Mem_TryAlloc(count, sizeof(struct Floor));
+	if (!ctx->floors) return ERR_OUT_OF_MEMORY;
+
+	for (i = 0; i < count; i++) 
+	{
+		int floor = Vorbis_ReadBits(ctx, 16);
+		if (floor != 1) return VORBIS_ERR_FLOOR_TYPE;
+
+		res = Floor_DecodeSetup(ctx, &ctx->floors[i]);
+		if (res) return res;
+	}
+
+	count = Vorbis_ReadBits(ctx, 6) + 1;
+	ctx->residues = (struct Residue*)Mem_TryAlloc(count, sizeof(struct Residue));
+	if (!ctx->residues) return ERR_OUT_OF_MEMORY;
+
+	for (i = 0; i < count; i++) 
+	{
+		int residue = Vorbis_ReadBits(ctx, 16);
+		if (residue > 2) return VORBIS_ERR_FLOOR_TYPE;
+
+		res = Residue_DecodeSetup(ctx, &ctx->residues[i], residue);
+		if (res) return res;
+	}
+
+	count = Vorbis_ReadBits(ctx, 6) + 1;
+	ctx->mappings = (struct Mapping*)Mem_TryAlloc(count, sizeof(struct Mapping));
+	if (!ctx->mappings) return ERR_OUT_OF_MEMORY;
+
+	for (i = 0; i < count; i++) 
+	{
+		int mapping = Vorbis_ReadBits(ctx, 16);
+		if (mapping != 0) return VORBIS_ERR_MAPPING_TYPE;
+
+		res = Mapping_DecodeSetup(ctx, &ctx->mappings[i]);
+		if (res) return res;
+	}
+
+	count = Vorbis_ReadBits(ctx, 6) + 1;
+	ctx->modes = (struct Mode*)Mem_TryAlloc(count, sizeof(struct Mode));
+	if (!ctx->modes) return ERR_OUT_OF_MEMORY;
+
+	for (i = 0; i < count; i++) 
+	{
+		res = Mode_DecodeSetup(ctx, &ctx->modes[i]);
+		if (res) return res;
+	}
+	
+	ctx->modeNumBits = iLog(count - 1); /* ilog([vorbis_mode_count]-1) bits */
+	framing = Vorbis_ReadBit(ctx);
+	Vorbis_AlignBits(ctx);
+	/* check framing flag */
+	return (framing & 1) ? 0 : VORBIS_ERR_FRAMING;
+}
+
+/* Vorbis spec 4.2. Header decode and decode setup */
+cc_result Vorbis_DecodeHeaders(struct VorbisState* ctx) {
+	cc_uint32 count;
+	cc_result res;
+	
+	if ((res = Vorbis_CheckHeader(ctx, 1)))   return res;
+	if ((res = Vorbis_DecodeIdentifier(ctx))) return res;
+	Ogg_DiscardPacket(ctx->source);
+
+	if ((res = Vorbis_CheckHeader(ctx, 3)))   return res;
+	if ((res = Vorbis_DecodeComments(ctx)))   return res;
+	Ogg_DiscardPacket(ctx->source);
+
+	if ((res = Vorbis_CheckHeader(ctx, 5)))   return res;
+	if ((res = Vorbis_DecodeSetup(ctx)))      return res;
+	Ogg_DiscardPacket(ctx->source);
+
+	/* window calculations can be pre-computed here */
+	count = ctx->blockSizes[0] + ctx->blockSizes[1];
+	ctx->windowRaw = (float*)Mem_TryAlloc(count, sizeof(float));
+	if (!ctx->windowRaw) return ERR_OUT_OF_MEMORY;
+
+	ctx->windows[0].Prev = ctx->windowRaw;
+	ctx->windows[1].Prev = ctx->windowRaw + ctx->blockSizes[0];
+
+	Vorbis_CalcWindow(&ctx->windows[0], ctx->blockSizes[0]);
+	Vorbis_CalcWindow(&ctx->windows[1], ctx->blockSizes[1]);
+
+	count     = ctx->channels * ctx->blockSizes[1];
+	ctx->temp = (float*)Mem_TryAllocCleared(count * 3, sizeof(float));
+	if (!ctx->temp) return ERR_OUT_OF_MEMORY;
+
+	ctx->values[0] = ctx->temp + count;
+	ctx->values[1] = ctx->temp + count * 2;
+
+	imdct_init(&ctx->imdct[0], ctx->blockSizes[0]);
+	imdct_init(&ctx->imdct[1], ctx->blockSizes[1]);
+	return 0;
+}
+
+
+/*########################################################################################################################*
+*-----------------------------------------------------Vorbis frame--------------------------------------------------------*
+*#########################################################################################################################*/
+/* Vorbis spec 4.3. Audio packet decode and synthesis */
+cc_result Vorbis_DecodeFrame(struct VorbisState* ctx) {
+	/* frame header */
+	cc_uint32 packetType;
+	struct Mapping* mapping;
+	struct Mode* mode;
+	int modeIdx;
+
+	/* floor/residue */
+	cc_bool hasFloor[VORBIS_MAX_CHANS];
+	cc_bool hasResidue[VORBIS_MAX_CHANS];
+	cc_bool doNotDecode[VORBIS_MAX_CHANS];
+	float* data[VORBIS_MAX_CHANS];
+	int submap, floorIdx;
+	int ch, residueIdx;
+
+	/* inverse coupling */
+	int magChannel, angChannel;
+	float* magValues, m;
+	float* angValues, a;
+
+	/* misc variables */
+	float* tmp;
+	cc_uint32 alignSkip;
+	int i, j; 
+	cc_result res;
+	
+	res = Vorbis_TryReadBits(ctx, 1, &packetType);
+	if (res) return res;
+	if (packetType) return VORBIS_ERR_FRAME_TYPE;
+
+	modeIdx = Vorbis_ReadBits(ctx, ctx->modeNumBits);
+	mode    = &ctx->modes[modeIdx];
+	mapping = &ctx->mappings[mode->mappingIdx];
+
+	/* decode window shape */
+	ctx->curBlockSize = ctx->blockSizes[mode->blockSizeFlag];
+	ctx->dataSize     = ctx->curBlockSize / 2;
+	/* long window lapping flags - we don't care about them though */
+	if (mode->blockSizeFlag) { Vorbis_ReadBits(ctx, 2); } /* TODO: do we just SkipBits here */
+
+	/* swap prev and cur outputs around */
+	tmp = ctx->values[1]; ctx->values[1] = ctx->values[0]; ctx->values[0] = tmp;
+	Mem_Set(ctx->values[0], 0, ctx->channels * ctx->curBlockSize);
+
+	for (i = 0; i < ctx->channels; i++) 
+	{
+		ctx->curOutput[i]  = ctx->values[0] + i * ctx->curBlockSize;
+		ctx->prevOutput[i] = ctx->values[1] + i * ctx->prevBlockSize;
+	}
+
+	/* decode floor */
+	for (i = 0; i < ctx->channels; i++) 
+	{
+		submap   = mapping->mux[i];
+		floorIdx = mapping->floorIdx[submap];
+		hasFloor[i]   = Floor_DecodeFrame(ctx, &ctx->floors[floorIdx], i);
+		hasResidue[i] = hasFloor[i];
+	}
+
+	/* non-zero vector propogate */
+	for (i = 0; i < mapping->couplingSteps; i++) 
+	{
+		magChannel = mapping->magnitude[i];
+		angChannel = mapping->angle[i];
+
+		if (hasResidue[magChannel] || hasResidue[angChannel]) {
+			hasResidue[magChannel] = true; hasResidue[angChannel] = true;
+		}
+	}
+
+	/* decode residue */
+	for (i = 0; i < mapping->submaps; i++) 
+	{
+		ch = 0;
+		/* map residue data to actual channel data */
+		for (j = 0; j < ctx->channels; j++) 
+		{
+			if (mapping->mux[j] != i) continue;
+
+			doNotDecode[ch] = !hasResidue[j];
+			data[ch] = ctx->curOutput[j];
+			ch++;
+		}
+
+		residueIdx = mapping->floorIdx[i];
+		Residue_DecodeFrame(ctx, &ctx->residues[residueIdx], ch, doNotDecode, data);
+	}
+
+	/* inverse coupling */
+	for (i = mapping->couplingSteps - 1; i >= 0; i--) 
+	{
+		magValues = ctx->curOutput[mapping->magnitude[i]];
+		angValues = ctx->curOutput[mapping->angle[i]];
+
+		for (j = 0; j < ctx->dataSize; j++) 
+		{
+			m = magValues[j]; a = angValues[j];
+
+			if (m > 0.0f) {
+				if (a > 0.0f) { angValues[j] = m - a; }
+				else {
+					angValues[j] = m;
+					magValues[j] = m + a;
+				}
+			} else {
+				if (a > 0.0f) { angValues[j] = m + a; }
+				else {
+					angValues[j] = m;
+					magValues[j] = m - a;
+				}
+			}
+		}
+	}
+
+	/* compute dot product of floor and residue, producing audio spectrum vector */
+	for (i = 0; i < ctx->channels; i++) 
+	{
+		if (!hasFloor[i]) continue;
+
+		submap   = mapping->mux[i];
+		floorIdx = mapping->floorIdx[submap];
+		Floor_Synthesis(ctx, &ctx->floors[floorIdx], i);
+	}
+
+	/* inverse monolithic transform of audio spectrum vector */
+	for (i = 0; i < ctx->channels; i++) 
+	{
+		tmp = ctx->curOutput[i];
+
+		if (!hasFloor[i]) {
+			/* TODO: Do we actually need to zero data here (residue type 2 maybe) */
+			Mem_Set(tmp, 0, ctx->curBlockSize * sizeof(float));
+		} else {
+			imdct_calc(tmp, tmp, &ctx->imdct[mode->blockSizeFlag]);
+			/* defer windowing until output */
+		}
+	}
+
+	/* discard remaining bits at end of packet */
+	Vorbis_AlignBits(ctx);
+	return 0;
+}
+
+int Vorbis_OutputFrame(struct VorbisState* ctx, cc_int16* data) {
+	struct VorbisWindow window;
+	float* prev[VORBIS_MAX_CHANS];
+	float*  cur[VORBIS_MAX_CHANS];
+
+	int curQrtr, prevQrtr, overlapQtr;
+	int curOffset, prevOffset, overlapSize;
+	float sample;
+	int i, ch;
+
+	/* first frame decoded has no data */
+	if (ctx->prevBlockSize == 0) {
+		ctx->prevBlockSize = ctx->curBlockSize;
+		return 0;
+	}
+
+	/* data returned is from centre of previous block to centre of current block */
+	/* data is aligned, such that 3/4 of prev block is aligned to 1/4 of cur block */
+	curQrtr   = ctx->curBlockSize  / 4;
+	prevQrtr  = ctx->prevBlockSize / 4;
+	overlapQtr = min(curQrtr, prevQrtr);
+	
+	/* So for example, consider a short block overlapping with a long block
+	   a) we need to chop off 'prev' before its halfway point
+	   b) then need to chop off the 'cur' before the halfway point of 'prev'
+	             |-   ********|*****                        |-   ********|
+	            -| - *        |     ***                     | - *        |
+	           - |  #         |        ***          ===>    |  #         |
+	          -  | * -        |           ***               | * -        |
+	   ******-***|*   -       |              ***            |*   -       |
+	*/	
+	curOffset  = curQrtr  - overlapQtr;
+	prevOffset = prevQrtr - overlapQtr;
+
+	for (i = 0; i < ctx->channels; i++) 
+	{
+		prev[i] = ctx->prevOutput[i] + (prevQrtr * 2);
+		cur[i]  = ctx->curOutput[i];
+	}
+
+	/* for long prev and short cur block, there will be non-overlapped data before */
+	for (i = 0; i < prevOffset; i++) 
+	{
+		for (ch = 0; ch < ctx->channels; ch++) 
+		{
+			sample = prev[ch][i];
+			Math_Clamp(sample, -1.0f, 1.0f);
+			*data++ = (cc_int16)(sample * 32767);
+		}
+	}
+
+	/* adjust pointers to start at 0 for overlapping */
+	for (i = 0; i < ctx->channels; i++) 
+	{
+		prev[i] += prevOffset; cur[i] += curOffset;
+	}
+
+	overlapSize = overlapQtr * 2;
+	window = ctx->windows[(overlapQtr * 4) == ctx->blockSizes[1]];
+
+	/* overlap and add data */
+	/* also perform windowing here */
+	for (i = 0; i < overlapSize; i++) 
+	{
+		for (ch = 0; ch < ctx->channels; ch++) 
+		{
+			sample = prev[ch][i] * window.Prev[i] + cur[ch][i] * window.Cur[i];
+			Math_Clamp(sample, -1.0f, 1.0f);
+			*data++ = (cc_int16)(sample * 32767);
+		}
+	}
+
+	/* for long cur and short prev block, there will be non-overlapped data after */
+	for (i = 0; i < ctx->channels; i++) { cur[i] += overlapSize; }
+	for (i = 0; i < curOffset; i++) 
+	{
+		for (ch = 0; ch < ctx->channels; ch++) 
+		{
+			sample = cur[ch][i];
+			Math_Clamp(sample, -1.0f, 1.0f);
+			*data++ = (cc_int16)(sample * 32767);
+		}
+	}
+
+	ctx->prevBlockSize = ctx->curBlockSize;
+	return (prevQrtr + curQrtr) * ctx->channels;
+}