src/siege/internal/stb/stb

Bug Summary

File:	c:\siege\siege/src/siege/internal/stb/stb_vorbis.c
Location:	line 5239, column 22
Description:	Value stored to 'z' is never read

Annotated Source Code

1	// Ogg Vorbis I audio decoder -- version 0.99996
2	//
3	// Written in April 2007 by Sean Barrett, sponsored by RAD Game Tools.
4	//
5	// Placed in the public domain April 2007 by the author: no copyright is
6	// claimed, and you may use it for any purpose you like.
7	//
8	// No warranty for any purpose is expressed or implied by the author (nor
9	// by RAD Game Tools). Report bugs and send enhancements to the author.
10	//
11	// Get the latest version and other information at:
12	// http://nothings.org/stb_vorbis/
13
14
15	// Todo:
16	//
17	// - seeking (note you can seek yourself using the pushdata API)
18	//
19	// Limitations:
20	//
21	// - floor 0 not supported (used in old ogg vorbis files)
22	// - lossless sample-truncation at beginning ignored
23	// - cannot concatenate multiple vorbis streams
24	// - sample positions are 32-bit, limiting seekable 192Khz
25	// files to around 6 hours (Ogg supports 64-bit)
26	//
27	// All of these limitations may be removed in future versions.
28
29
30	//////////////////////////////////////////////////////////////////////////////
31	//
32	// HEADER BEGINS HERE
33	//
34
35	#ifndef STB_VORBIS_INCLUDE_STB_VORBIS_H
36	#define STB_VORBIS_INCLUDE_STB_VORBIS_H
37
38	#if defined(STB_VORBIS_NO_CRT) && !defined(STB_VORBIS_NO_STDIO)
39	#define STB_VORBIS_NO_STDIO 1
40	#endif
41
42	#ifndef STB_VORBIS_NO_STDIO
43	#include <stdio.h>
44	#endif
45
46	#ifdef __cplusplus
47	extern "C" {
48	#endif
49
50	/////////// THREAD SAFETY
51
52	// Individual stb_vorbis* handles are not thread-safe; you cannot decode from
53	// them from multiple threads at the same time. However, you can have multiple
54	// stb_vorbis* handles and decode from them independently in multiple threads.
55
56
57	/////////// MEMORY ALLOCATION
58
59	// normally stb_vorbis uses malloc() to allocate memory at startup,
60	// and alloca() to allocate temporary memory during a frame on the
61	// stack. (Memory consumption will depend on the amount of setup
62	// data in the file and how you set the compile flags for speed
63	// vs. size. In my test files the maximal-size usage is ~150KB.)
64	//
65	// You can modify the wrapper functions in the source (setup_malloc,
66	// setup_temp_malloc, temp_malloc) to change this behavior, or you
67	// can use a simpler allocation model: you pass in a buffer from
68	// which stb_vorbis will allocate _all_ its memory (including the
69	// temp memory). "open" may fail with a VORBIS_outofmem if you
70	// do not pass in enough data; there is no way to determine how
71	// much you do need except to succeed (at which point you can
72	// query get_info to find the exact amount required. yes I know
73	// this is lame).
74	//
75	// If you pass in a non-NULL buffer of the type below, allocation
76	// will occur from it as described above. Otherwise just pass NULL
77	// to use malloc()/alloca()
78
79	typedef struct
80	{
81	char *alloc_buffer;
82	int alloc_buffer_length_in_bytes;
83	} stb_vorbis_alloc;
84
85
86	/////////// FUNCTIONS USEABLE WITH ALL INPUT MODES
87
88	typedef struct stb_vorbis stb_vorbis;
89
90	typedef struct
91	{
92	unsigned int sample_rate;
93	int channels;
94
95	unsigned int setup_memory_required;
96	unsigned int setup_temp_memory_required;
97	unsigned int temp_memory_required;
98
99	int max_frame_size;
100	} stb_vorbis_info;
101
102	// get general information about the file
103	extern stb_vorbis_info stb_vorbis_get_info(stb_vorbis *f);
104
105	// get the last error detected (clears it, too)
106	extern int stb_vorbis_get_error(stb_vorbis *f);
107
108	// close an ogg vorbis file and free all memory in use
109	extern void stb_vorbis_close(stb_vorbis *f);
110
111	// this function returns the offset (in samples) from the beginning of the
112	// file that will be returned by the next decode, if it is known, or -1
113	// otherwise. after a flush_pushdata() call, this may take a while before
114	// it becomes valid again.
115	// NOT WORKING YET after a seek with PULLDATA API
116	extern int stb_vorbis_get_sample_offset(stb_vorbis *f);
117
118	// returns the current seek point within the file, or offset from the beginning
119	// of the memory buffer. In pushdata mode it returns 0.
120	extern unsigned int stb_vorbis_get_file_offset(stb_vorbis *f);
121
122	/////////// PUSHDATA API
123
124	#ifndef STB_VORBIS_NO_PUSHDATA_API
125
126	// this API allows you to get blocks of data from any source and hand
127	// them to stb_vorbis. you have to buffer them; stb_vorbis will tell
128	// you how much it used, and you have to give it the rest next time;
129	// and stb_vorbis may not have enough data to work with and you will
130	// need to give it the same data again PLUS more. Note that the Vorbis
131	// specification does not bound the size of an individual frame.
132
133	extern stb_vorbis *stb_vorbis_open_pushdata(
134	unsigned char *datablock, int datablock_length_in_bytes,
135	int *datablock_memory_consumed_in_bytes,
136	int *error,
137	stb_vorbis_alloc *alloc_buffer);
138	// create a vorbis decoder by passing in the initial data block containing
139	// the ogg&vorbis headers (you don't need to parse them, just provide
140	// the first N bytes of the file--you're told if it's not enough, see below)
141	// on success, returns an stb_vorbis *, does not set error, returns the amount of
142	// data parsed/consumed on this call in *datablock_memory_consumed_in_bytes;
143	// on failure, returns NULL and sets *error; does not change *datablock_memory_consumed_in_bytes
144	// if returns NULL and *error is VORBIS_need_more_data, then the input block was
145	// incomplete and you need to pass in a larger block from the start of the file
146
147	extern int stb_vorbis_decode_frame_pushdata(
148	stb_vorbis f, unsigned char datablock, int datablock_length_in_bytes,
149	int channels, // place to write number of float buffers
150	float *output, // place to write float array of float * buffers
151	int *samples // place to write number of output samples
152	);
153	// decode a frame of audio sample data if possible from the passed-in data block
154	//
155	// return value: number of bytes we used from datablock
156	// possible cases:
157	// 0 bytes used, 0 samples output (need more data)
158	// N bytes used, 0 samples output (resynching the stream, keep going)
159	// N bytes used, M samples output (one frame of data)
160	// note that after opening a file, you will ALWAYS get one N-bytes,0-sample
161	// frame, because Vorbis always "discards" the first frame.
162	//
163	// Note that on resynch, stb_vorbis will rarely consume all of the buffer,
164	// instead only datablock_length_in_bytes-3 or less. This is because it wants
165	// to avoid missing parts of a page header if they cross a datablock boundary,
166	// without writing state-machiney code to record a partial detection.
167	//
168	// The number of channels returned are stored in *channels (which can be
169	// NULL--it is always the same as the number of channels reported by
170	// get_info). *output will contain an array of float* buffers, one per
171	// channel. In other words, (*output)[0][0] contains the first sample from
172	// the first channel, and (*output)[1][0] contains the first sample from
173	// the second channel.
174
175	extern void stb_vorbis_flush_pushdata(stb_vorbis *f);
176	// inform stb_vorbis that your next datablock will not be contiguous with
177	// previous ones (e.g. you've seeked in the data); future attempts to decode
178	// frames will cause stb_vorbis to resynchronize (as noted above), and
179	// once it sees a valid Ogg page (typically 4-8KB, as large as 64KB), it
180	// will begin decoding the _next_ frame.
181	//
182	// if you want to seek using pushdata, you need to seek in your file, then
183	// call stb_vorbis_flush_pushdata(), then start calling decoding, then once
184	// decoding is returning you data, call stb_vorbis_get_sample_offset, and
185	// if you don't like the result, seek your file again and repeat.
186	#endif
187
188
189	////////// PULLING INPUT API
190
191	#ifndef STB_VORBIS_NO_PULLDATA_API
192	// This API assumes stb_vorbis is allowed to pull data from a source--
193	// either a block of memory containing the _entire_ vorbis stream, or a
194	// FILE * that you or it create, or possibly some other reading mechanism
195	// if you go modify the source to replace the FILE * case with some kind
196	// of callback to your code. (But if you don't support seeking, you may
197	// just want to go ahead and use pushdata.)
198
// One-shot decoders: the decoded, interleaved samples are returned through *output.
// NOTE(review): *channels presumably receives the stream's channel count -- confirm
// against the implementation.
#if !defined(STB_VORBIS_NO_STDIO) && !defined(STB_VORBIS_NO_INTEGER_CONVERSION)
extern int stb_vorbis_decode_filename(char *filename, int *channels, short **output);
#endif
extern int stb_vorbis_decode_memory(unsigned char *mem, int len, int *channels, short **output);
203	// decode an entire file and output the data interleaved into a malloc()ed
204	// buffer stored in *output. The return value is the number of samples
205	// decoded, or -1 if the file could not be opened or was not an ogg vorbis file.
206	// When you're done with it, just free() the pointer returned in *output.
207
208	extern stb_vorbis * stb_vorbis_open_memory(unsigned char *data, int len,
209	int error, stb_vorbis_alloc alloc_buffer);
210	// create an ogg vorbis decoder from an ogg vorbis stream in memory (note
211	// this must be the entire stream!). on failure, returns NULL and sets *error
212
213	#ifndef STB_VORBIS_NO_STDIO
214	extern stb_vorbis * stb_vorbis_open_filename(char *filename,
215	int error, stb_vorbis_alloc alloc_buffer);
216	// create an ogg vorbis decoder from a filename via fopen(). on failure,
217	// returns NULL and sets *error (possibly to VORBIS_file_open_failure).
218
219	extern stb_vorbis * stb_vorbis_open_file(FILE *f, int close_handle_on_close,
220	int error, stb_vorbis_alloc alloc_buffer);
221	// create an ogg vorbis decoder from an open FILE *, looking for a stream at
222	// the _current_ seek point (ftell). on failure, returns NULL and sets *error.
223	// note that stb_vorbis must "own" this stream; if you seek it in between
224	// calls to stb_vorbis, it will become confused. Moreover, if you attempt to
225	// perform stb_vorbis_seek_*() operations on this file, it will assume it
226	// owns the _entire_ rest of the file after the start point. Use the next
227	// function, stb_vorbis_open_file_section(), to limit it.
228
229	extern stb_vorbis * stb_vorbis_open_file_section(FILE *f, int close_handle_on_close,
230	int error, stb_vorbis_alloc alloc_buffer, unsigned int len);
231	// create an ogg vorbis decoder from an open FILE *, looking for a stream at
232	// the _current_ seek point (ftell); the stream will be of length 'len' bytes.
233	// on failure, returns NULL and sets *error. note that stb_vorbis must "own"
234	// this stream; if you seek it in between calls to stb_vorbis, it will become
235	// confused.
236	#endif
237
238	extern int stb_vorbis_seek_frame(stb_vorbis *f, unsigned int sample_number);
239	extern int stb_vorbis_seek(stb_vorbis *f, unsigned int sample_number);
240	// NOT WORKING YET
241	// these functions seek in the Vorbis file to (approximately) 'sample_number'.
242	// after calling seek_frame(), the next call to get_frame_*() will include
243	// the specified sample. after calling stb_vorbis_seek(), the next call to
244	// stb_vorbis_get_samples_* will start with the specified sample. If you
245	// do not need to seek to EXACTLY the target sample when using get_samples_*,
246	// you can also use seek_frame().
247
248	extern void stb_vorbis_seek_start(stb_vorbis *f);
249	// this function is equivalent to stb_vorbis_seek(f,0), but it
250	// actually works
251
252	extern unsigned int stb_vorbis_stream_length_in_samples(stb_vorbis *f);
253	extern float stb_vorbis_stream_length_in_seconds(stb_vorbis *f);
254	// these functions return the total length of the vorbis stream
255
256	extern int stb_vorbis_get_frame_float(stb_vorbis f, int channels, float ***output);
257	// decode the next frame and return the number of samples. the number of
258	// channels returned are stored in *channels (which can be NULL--it is always
259	// the same as the number of channels reported by get_info). *output will
260	// contain an array of float* buffers, one per channel. These outputs will
261	// be overwritten on the next call to stb_vorbis_get_frame_*.
262	//
263	// You generally should not intermix calls to stb_vorbis_get_frame_*()
264	// and stb_vorbis_get_samples_*(), since the latter calls the former.
265
266	#ifndef STB_VORBIS_NO_INTEGER_CONVERSION
267	extern int stb_vorbis_get_frame_short_interleaved(stb_vorbis f, int num_c, short buffer, int num_shorts);
268	extern int stb_vorbis_get_frame_short (stb_vorbis f, int num_c, short *buffer, int num_samples);
269	#endif
270	// decode the next frame and return the number of samples per channel. the
271	// data is coerced to the number of channels you request according to the
272	// channel coercion rules (see below). You must pass in the size of your
273	// buffer(s) so that stb_vorbis will not overwrite the end of the buffer.
274	// The maximum buffer size needed can be gotten from get_info(); however,
275	// the Vorbis I specification implies an absolute maximum of 4096 samples
276	// per channel. Note that for interleaved data, you pass in the number of
277	// shorts (the size of your array), but the return value is the number of
278	// samples per channel, not the total number of samples.
279
280	// Channel coercion rules:
281	// Let M be the number of channels requested, and N the number of channels present,
282	// and Cn be the nth channel; let stereo L be the sum of all L and center channels,
283	// and stereo R be the sum of all R and center channels (channel assignment from the
284	// vorbis spec).
285	// M N output
286	// 1 k sum(Ck) for all k
287	// 2 * stereo L, stereo R
288	// k l k > l, the first l channels, then 0s
289	// k l k <= l, the first k channels
290	// Note that this is not _good_ surround etc. mixing at all! It's just so
291	// you get something useful.
292
293	extern int stb_vorbis_get_samples_float_interleaved(stb_vorbis f, int channels, float buffer, int num_floats);
294	extern int stb_vorbis_get_samples_float(stb_vorbis f, int channels, float *buffer, int num_samples);
295	// gets num_samples samples, not necessarily on a frame boundary--this requires
296	// buffering so you have to supply the buffers. DOES NOT APPLY THE COERCION RULES.
297	// Returns the number of samples stored per channel; it may be less than requested
298	// at the end of the file. If there are no more samples in the file, returns 0.
299
300	#ifndef STB_VORBIS_NO_INTEGER_CONVERSION
301	extern int stb_vorbis_get_samples_short_interleaved(stb_vorbis f, int channels, short buffer, int num_shorts);
302	extern int stb_vorbis_get_samples_short(stb_vorbis f, int channels, short *buffer, int num_samples);
303	#endif
304	// gets num_samples samples, not necessarily on a frame boundary--this requires
305	// buffering so you have to supply the buffers. Applies the coercion rules above
306	// to produce 'channels' channels. Returns the number of samples stored per channel;
307	// it may be less than requested at the end of the file. If there are no more
308	// samples in the file, returns 0.
309
310	#endif
311
312	//////// ERROR CODES
313
314	enum STBVorbisError
315	{
316	VORBIS__no_error,
317
318	VORBIS_need_more_data=1, // not a real error
319
320	VORBIS_invalid_api_mixing, // can't mix API modes
321	VORBIS_outofmem, // not enough memory
322	VORBIS_feature_not_supported, // uses floor 0
323	VORBIS_too_many_channels, // STB_VORBIS_MAX_CHANNELS is too small
324	VORBIS_file_open_failure, // fopen() failed
325	VORBIS_seek_without_length, // can't seek in unknown-length file
326
327	VORBIS_unexpected_eof=10, // file is truncated?
328	VORBIS_seek_invalid, // seek past EOF
329
330	// decoding errors (corrupt/invalid stream) -- you probably
331	// don't care about the exact details of these
332
333	// vorbis errors:
334	VORBIS_invalid_setup=20,
335	VORBIS_invalid_stream,
336
337	// ogg errors:
338	VORBIS_missing_capture_pattern=30,
339	VORBIS_invalid_stream_structure_version,
340	VORBIS_continued_packet_flag_invalid,
341	VORBIS_incorrect_stream_serial_number,
342	VORBIS_invalid_first_page,
343	VORBIS_bad_packet_type,
344	VORBIS_cant_find_last_page,
345	VORBIS_seek_failed,
346	};
347
348
349	#ifdef __cplusplus
350	}
351	#endif
352
353	#endif // STB_VORBIS_INCLUDE_STB_VORBIS_H
354	//
355	// HEADER ENDS HERE
356	//
357	//////////////////////////////////////////////////////////////////////////////
358
359	#ifndef STB_VORBIS_HEADER_ONLY
360
361	// global configuration settings (e.g. set these in the project/makefile),
362	// or just set them in this file at the top (although ideally the first few
363	// should be visible when the header file is compiled too, although it's not
364	// crucial)
365
366	// STB_VORBIS_NO_PUSHDATA_API
367	// does not compile the code for the various stb_vorbis_*_pushdata()
368	// functions
369	// #define STB_VORBIS_NO_PUSHDATA_API
370
371	// STB_VORBIS_NO_PULLDATA_API
372	// does not compile the code for the non-pushdata APIs
373	// #define STB_VORBIS_NO_PULLDATA_API
374
375	// STB_VORBIS_NO_STDIO
376	// does not compile the code for the APIs that use FILE *s internally
377	// or externally (implied by STB_VORBIS_NO_PULLDATA_API)
378	// #define STB_VORBIS_NO_STDIO
379
380	// STB_VORBIS_NO_INTEGER_CONVERSION
381	// does not compile the code for converting audio sample data from
382	// float to integer (implied by STB_VORBIS_NO_PULLDATA_API)
383	// #define STB_VORBIS_NO_INTEGER_CONVERSION
384
385	// STB_VORBIS_NO_FAST_SCALED_FLOAT
386	// does not use a fast float-to-int trick to accelerate float-to-int on
387	// most platforms which requires endianness be defined correctly.
388	//#define STB_VORBIS_NO_FAST_SCALED_FLOAT
389
390
391	// STB_VORBIS_MAX_CHANNELS [number]
392	// globally define this to the maximum number of channels you need.
393	// The spec does not put a restriction on channels except that
394	// the count is stored in a byte, so 255 is the hard limit.
395	// Reducing this saves about 16 bytes per value, so using 16 saves
396	// (255-16)*16 or around 4KB. Plus any other memory usage
397	// I forgot to account for. Can probably go as low as 8 (7.1 audio),
398	// 6 (5.1 audio), or 2 (stereo only).
399	#ifndef STB_VORBIS_MAX_CHANNELS16
400	#define STB_VORBIS_MAX_CHANNELS16 16 // enough for anyone?
401	#endif
402
403	// STB_VORBIS_PUSHDATA_CRC_COUNT [number]
404	// after a flush_pushdata(), stb_vorbis begins scanning for the
405	// next valid page, without backtracking. when it finds something
406	// that looks like a page, it streams through it and verifies its
407	// CRC32. Should that validation fail, it keeps scanning. But it's
408	// possible that _while_ streaming through to check the CRC32 of
409	// one candidate page, it sees another candidate page. This #define
410	// determines how many "overlapping" candidate pages it can search
411	// at once. Note that "real" pages are typically ~4KB to ~8KB, whereas
412	// garbage pages could be as big as 64KB, but probably average ~16KB.
413	// So don't hose ourselves by scanning an apparent 64KB page and
414	// missing a ton of real ones in the interim; so minimum of 2
415	#ifndef STB_VORBIS_PUSHDATA_CRC_COUNT4
416	#define STB_VORBIS_PUSHDATA_CRC_COUNT4 4
417	#endif
418
419	// STB_VORBIS_FAST_HUFFMAN_LENGTH [number]
420	// sets the log size of the huffman-acceleration table. Maximum
421	// supported value is 24. with larger numbers, more decodings are O(1),
422	// but the table size is larger so worse cache missing, so you'll have
423	// to probe (and try multiple ogg vorbis files) to find the sweet spot.
424	#ifndef STB_VORBIS_FAST_HUFFMAN_LENGTH10
425	#define STB_VORBIS_FAST_HUFFMAN_LENGTH10 10
426	#endif
427
428	// STB_VORBIS_FAST_BINARY_LENGTH [number]
429	// sets the log size of the binary-search acceleration table. this
430	// is used in similar fashion to the fast-huffman size to set initial
431	// parameters for the binary search
432
433	// STB_VORBIS_FAST_HUFFMAN_INT
434	// The fast huffman tables are much more efficient if they can be
435	// stored as 16-bit results instead of 32-bit results. This restricts
436	// the codebooks to having only 65535 possible outcomes, though.
437	// (At least, accelerated by the huffman table.)
438	#ifndef STB_VORBIS_FAST_HUFFMAN_INT
439	#define STB_VORBIS_FAST_HUFFMAN_SHORT
440	#endif
441
442	// STB_VORBIS_NO_HUFFMAN_BINARY_SEARCH
443	// If the 'fast huffman' search doesn't succeed, then stb_vorbis falls
444	// back on binary searching for the correct one. This requires storing
445	// extra tables with the huffman codes in sorted order. Defining this
446	// symbol trades off space for speed by forcing a linear search in the
447	// non-fast case, except for "sparse" codebooks.
448	// #define STB_VORBIS_NO_HUFFMAN_BINARY_SEARCH
449
450	// STB_VORBIS_DIVIDES_IN_RESIDUE
451	// stb_vorbis precomputes the result of the scalar residue decoding
452	// that would otherwise require a divide per chunk. you can trade off
453	// space for time by defining this symbol.
454	// #define STB_VORBIS_DIVIDES_IN_RESIDUE
455
456	// STB_VORBIS_DIVIDES_IN_CODEBOOK
457	// vorbis VQ codebooks can be encoded two ways: with every case explicitly
458	// stored, or with all elements being chosen from a small range of values,
459	// and all values possible in all elements. By default, stb_vorbis expands
460	// this latter kind out to look like the former kind for ease of decoding,
461	// because otherwise an integer divide-per-vector-element is required to
462	// unpack the index. If you define STB_VORBIS_DIVIDES_IN_CODEBOOK, you can
463	// trade off storage for speed.
464	//#define STB_VORBIS_DIVIDES_IN_CODEBOOK
465
466	// STB_VORBIS_CODEBOOK_SHORTS
467	// The vorbis file format encodes VQ codebook floats as ax+b where a and
468	// b are floating point per-codebook constants, and x is a 16-bit int.
469	// Normally, stb_vorbis decodes them to floats rather than leaving them
470	// as 16-bit ints and computing ax+b while decoding. This is a speed/space
471	// tradeoff; you can save space by defining this flag.
472	#ifndef STB_VORBIS_CODEBOOK_SHORTS
473	#define STB_VORBIS_CODEBOOK_FLOATS
474	#endif
475
476	// STB_VORBIS_DIVIDE_TABLE
477	// this replaces small integer divides in the floor decode loop with
478	// table lookups. made less than 1% difference, so disabled by default.
479
480	// STB_VORBIS_NO_INLINE_DECODE
481	// disables the inlining of the scalar codebook fast-huffman decode.
482	// might save a little codespace; useful for debugging
483	// #define STB_VORBIS_NO_INLINE_DECODE
484
485	// STB_VORBIS_NO_DEFER_FLOOR
486	// Normally we only decode the floor without synthesizing the actual
487	// full curve. We can instead synthesize the curve immediately. This
488	// requires more memory and is very likely slower, so I don't think
489	// you'd ever want to do it except for debugging.
490	// #define STB_VORBIS_NO_DEFER_FLOOR
491
492
493
494
495	//////////////////////////////////////////////////////////////////////////////
496
497	#ifdef STB_VORBIS_NO_PULLDATA_API
498	#define STB_VORBIS_NO_INTEGER_CONVERSION
499	#define STB_VORBIS_NO_STDIO
500	#endif
501
502	#if defined(STB_VORBIS_NO_CRT) && !defined(STB_VORBIS_NO_STDIO)
503	#define STB_VORBIS_NO_STDIO 1
504	#endif
505
506	#ifndef STB_VORBIS_NO_INTEGER_CONVERSION
507	#ifndef STB_VORBIS_NO_FAST_SCALED_FLOAT
508
509	// only need endianness for fast-float-to-int, which we don't
510	// use for pushdata
511
512	#ifndef STB_VORBIS_BIG_ENDIAN
513	#define STB_VORBIS_ENDIAN0 0
514	#else
515	#define STB_VORBIS_ENDIAN0 1
516	#endif
517
518	#endif
519	#endif
520
521
522	#ifndef STB_VORBIS_NO_STDIO
523	#include <stdio.h>
524	#endif
525
526	#ifndef STB_VORBIS_NO_CRT
527	#include <stdlib.h>
528	#include <string.h>
529	#include <assert.h>
530	#include <math.h>
531	#else
532	#define NULL((void*)0) 0
533	#endif
534
// Compilers other than MSVC get a fallback for the __forceinline spelling:
// plain `inline` when __GNUC__ is set, nothing otherwise.
#ifndef _MSC_VER
   #if __GNUC__
      #define __forceinline inline
   #else
      #define __forceinline
   #endif
#endif
542
543	#if STB_VORBIS_MAX_CHANNELS16 > 256
544	#error "Value of STB_VORBIS_MAX_CHANNELS outside of allowed range"
545	#endif
546
547	#if STB_VORBIS_FAST_HUFFMAN_LENGTH10 > 24
548	#error "Value of STB_VORBIS_FAST_HUFFMAN_LENGTH outside of allowed range"
549	#endif
550
551
// Largest block size, expressed as a power of two.
#define MAX_BLOCKSIZE_LOG  13   // from specification
#define MAX_BLOCKSIZE      (1 << MAX_BLOCKSIZE_LOG)
554
555
556	typedef unsigned char uint8;
557	typedef signed char int8;
558	typedef unsigned short uint16;
559	typedef signed short int16;
560	typedef unsigned int uint32;
561	typedef signed int int32;
562
563	#ifndef TRUE1
564	#define TRUE1 1
565	#define FALSE0 0
566	#endif
567
568	#ifdef STB_VORBIS_CODEBOOK_FLOATS
569	typedef float codetype;
570	#else
571	typedef uint16 codetype;
572	#endif
573
574	// @NOTE
575	//
576	// Some arrays below are tagged "//varies", which means it's actually
577	// a variable-sized piece of data, but rather than malloc I assume it's
578	// small enough it's better to just allocate it all together with the
579	// main thing
580	//
581	// Most of the variables are specified with the smallest size I could pack
582	// them into. It might give better performance to make them all full-sized
583	// integers. It should be safe to freely rearrange the structures or change
584	// the sizes larger--nothing relies on silently truncating etc., nor the
585	// order of variables.
586
587	#define FAST_HUFFMAN_TABLE_SIZE(1 << 10) (1 << STB_VORBIS_FAST_HUFFMAN_LENGTH10)
588	#define FAST_HUFFMAN_TABLE_MASK((1 << 10) - 1) (FAST_HUFFMAN_TABLE_SIZE(1 << 10) - 1)
589
590	typedef struct
591	{
592	int dimensions, entries;
593	uint8 *codeword_lengths;
594	float minimum_value;
595	float delta_value;
596	uint8 value_bits;
597	uint8 lookup_type;
598	uint8 sequence_p;
599	uint8 sparse;
600	uint32 lookup_values;
601	codetype *multiplicands;
602	uint32 *codewords;
603	#ifdef STB_VORBIS_FAST_HUFFMAN_SHORT
604	int16 fast_huffman[FAST_HUFFMAN_TABLE_SIZE(1 << 10)];
605	#else
606	int32 fast_huffman[FAST_HUFFMAN_TABLE_SIZE(1 << 10)];
607	#endif
608	uint32 *sorted_codewords;
609	int *sorted_values;
610	int sorted_entries;
611	} Codebook;
612
613	typedef struct
614	{
615	uint8 order;
616	uint16 rate;
617	uint16 bark_map_size;
618	uint8 amplitude_bits;
619	uint8 amplitude_offset;
620	uint8 number_of_books;
621	uint8 book_list[16]; // varies
622	} Floor0;
623
624	typedef struct
625	{
626	uint8 partitions;
627	uint8 partition_class_list[32]; // varies
628	uint8 class_dimensions[16]; // varies
629	uint8 class_subclasses[16]; // varies
630	uint8 class_masterbooks[16]; // varies
631	int16 subclass_books[16][8]; // varies
632	uint16 Xlist[31*8+2]; // varies
633	uint8 sorted_order[31*8+2];
634	uint8 neighbors[31*8+2][2];
635	uint8 floor1_multiplier;
636	uint8 rangebits;
637	int values;
638	} Floor1;
639
640	typedef union
641	{
642	Floor0 floor0;
643	Floor1 floor1;
644	} Floor;
645
646	typedef struct
647	{
648	uint32 begin, end;
649	uint32 part_size;
650	uint8 classifications;
651	uint8 classbook;
652	uint8 **classdata;
653	int16 (*residue_books)[8];
654	} Residue;
655
656	typedef struct
657	{
658	uint8 magnitude;
659	uint8 angle;
660	uint8 mux;
661	} MappingChannel;
662
663	typedef struct
664	{
665	uint16 coupling_steps;
666	MappingChannel *chan;
667	uint8 submaps;
668	uint8 submap_floor[15]; // varies
669	uint8 submap_residue[15]; // varies
670	} Mapping;
671
672	typedef struct
673	{
674	uint8 blockflag;
675	uint8 mapping;
676	uint16 windowtype;
677	uint16 transformtype;
678	} Mode;
679
680	typedef struct
681	{
682	uint32 goal_crc; // expected crc if match
683	int bytes_left; // bytes left in packet
684	uint32 crc_so_far; // running crc
685	int bytes_done; // bytes processed in _current_ chunk
686	uint32 sample_loc; // granule pos encoded in page
687	} CRCscan;
688
689	typedef struct
690	{
691	uint32 page_start, page_end;
692	uint32 after_previous_page_start;
693	uint32 first_decoded_sample;
694	uint32 last_decoded_sample;
695	} ProbedPage;
696
697	struct stb_vorbis
698	{
699	// user-accessible info
700	unsigned int sample_rate;
701	int channels;
702
703	unsigned int setup_memory_required;
704	unsigned int temp_memory_required;
705	unsigned int setup_temp_memory_required;
706
707	// input config
708	#ifndef STB_VORBIS_NO_STDIO
709	FILE *f;
710	uint32 f_start;
711	int close_on_free;
712	#endif
713
714	uint8 *stream;
715	uint8 *stream_start;
716	uint8 *stream_end;
717
718	uint32 stream_len;
719
720	uint8 push_mode;
721
722	uint32 first_audio_page_offset;
723
724	ProbedPage p_first, p_last;
725
726	// memory management
727	stb_vorbis_alloc alloc;
728	int setup_offset;
729	int temp_offset;
730
731	// run-time results
732	int eof;
733	enum STBVorbisError error;
734
735	// user-useful data
736
737	// header info
738	int blocksize[2];
739	int blocksize_0, blocksize_1;
740	int codebook_count;
741	Codebook *codebooks;
742	int floor_count;
743	uint16 floor_types[64]; // varies
744	Floor *floor_config;
745	int residue_count;
746	uint16 residue_types[64]; // varies
747	Residue *residue_config;
748	int mapping_count;
749	Mapping *mapping;
750	int mode_count;
751	Mode mode_config[64]; // varies
752
753	uint32 total_samples;
754
755	// decode buffer
756	float *channel_buffers[STB_VORBIS_MAX_CHANNELS16];
757	float *outputs [STB_VORBIS_MAX_CHANNELS16];
758
759	float *previous_window[STB_VORBIS_MAX_CHANNELS16];
760	int previous_length;
761
762	#ifndef STB_VORBIS_NO_DEFER_FLOOR
763	int16 *finalY[STB_VORBIS_MAX_CHANNELS16];
764	#else
765	float *floor_buffers[STB_VORBIS_MAX_CHANNELS16];
766	#endif
767
768	uint32 current_loc; // sample location of next frame to decode
769	int current_loc_valid;
770
771	// per-blocksize precomputed data
772
773	// twiddle factors
774	float A[2],B[2],*C(2 \| 4 \| 1)[2];
775	float *window[2];
776	uint16 *bit_reverse[2];
777
778	// current page/packet/segment streaming info
779	uint32 serial; // stream serial number for verification
780	int last_page;
781	int segment_count;
782	uint8 segments[255];
783	uint8 page_flag;
784	uint8 bytes_in_seg;
785	uint8 first_decode;
786	int next_seg;
787	int last_seg; // flag that we're on the last segment
788	int last_seg_which; // what was the segment number of the last seg?
789	uint32 acc;
790	int valid_bits;
791	int packet_bytes;
792	int end_seg_with_known_loc;
793	uint32 known_loc_for_packet;
794	int discard_samples_deferred;
795	uint32 samples_output;
796
797	// push mode scanning
798	int page_crc_tests; // only in push_mode: number of tests active; -1 if not searching
799	#ifndef STB_VORBIS_NO_PUSHDATA_API
800	CRCscan scan[STB_VORBIS_PUSHDATA_CRC_COUNT4];
801	#endif
802
803	// sample-access
804	int channel_buffer_start;
805	int channel_buffer_end;
806	};
807
808	extern int my_prof(int slot);
809	//#define stb_prof my_prof
810
811	#ifndef stb_prof
812	#define stb_prof(x)(void)0 (void)0
813	#endif
814
815	#if defined(STB_VORBIS_NO_PUSHDATA_API)
816	#define IS_PUSH_MODE(f)((f)->push_mode) FALSE0
817	#elif defined(STB_VORBIS_NO_PULLDATA_API)
818	#define IS_PUSH_MODE(f)((f)->push_mode) TRUE1
819	#else
820	#define IS_PUSH_MODE(f)((f)->push_mode) ((f)->push_mode)
821	#endif
822
823	typedef struct stb_vorbis vorb;
824
825	static int error(vorb *f, enum STBVorbisError e)
826	{
827	f->error = e;
828	if (!f->eof && e != VORBIS_need_more_data) {
829	f->error=e; // breakpoint for debugging
830	}
831	return 0;
832	}
833
834
835	// these functions are used for allocating temporary memory
836	// while decoding. if you can afford the stack space, use
837	// alloca(); otherwise, provide a temp buffer and it will
838	// allocate out of those.
839
// bytes needed for `count` pointers followed by `count` blocks of `size` bytes each
// (count is parenthesized so expression arguments such as `n+1` multiply correctly)
#define array_size_required(count,size)  ((count)*(sizeof(void *)+(size)))

// temporary allocation: taken from the user-supplied buffer when there is one,
// otherwise from the stack via alloca()
#define temp_alloc(f,size)              (f->alloc.alloc_buffer ? setup_temp_malloc(f,size) : alloca(size))
#ifdef dealloca
// NOTE(review): this expansion names `size`, which is not a parameter of temp_free -- confirm intent
#define temp_free(f,p)                  (f->alloc.alloc_buffer ? 0 : dealloca(size))
#else
#define temp_free(f,p)                  0
#endif
// save / restore the temp-allocation offset stored in the decoder
#define temp_alloc_save(f)              ((f)->temp_offset)
#define temp_alloc_restore(f,p)         ((f)->temp_offset = (p))

// temp-allocate one block and turn it into an array of `count` pointers to `size`-byte subblocks
#define temp_block_array(f,count,size)  make_block_array(temp_alloc(f,array_size_required(count,size)), count, size)
852
// given a sufficiently large block of memory, make an array of pointers to subblocks of it
//
// 'mem' must hold at least count*(sizeof(void *)+size) bytes and be suitably
// aligned for void *. The first 'count' pointer slots are filled so that slot i
// points at the i-th 'size'-byte subblock stored right after the pointer table.
// Returns 'mem', viewed as the pointer table.
static void *make_block_array(void *mem, int count, int size)
{
   int i;
   void **p = (void **) mem;
   char *q = (char *) (p + count);   // data area starts after the pointer table
   for (i=0; i < count; ++i) {
      p[i] = q;
      q += size;
   }
   return p;
}
865
866	static void setup_malloc(vorb f, int sz)
867	{
868	sz = (sz+3) & ~3;
869	f->setup_memory_required += sz;
870	if (f->alloc.alloc_buffer) {
871	void p = (char ) f->alloc.alloc_buffer + f->setup_offset;
872	if (f->setup_offset + sz > f->temp_offset) return NULL((void*)0);
873	f->setup_offset += sz;
874	return p;
875	}
876	return sz ? malloc(sz) : NULL((void*)0);
877	}
878
879	static void setup_free(vorb f, void p)
880	{
881	if (f->alloc.alloc_buffer) return; // do nothing; setup mem is not a stack
882	free(p);
883	}
884
885	static void setup_temp_malloc(vorb f, int sz)
886	{
887	sz = (sz+3) & ~3;
888	if (f->alloc.alloc_buffer) {
889	if (f->temp_offset - sz < f->setup_offset) return NULL((void*)0);
890	f->temp_offset -= sz;
891	return (char *) f->alloc.alloc_buffer + f->temp_offset;
892	}
893	return malloc(sz);
894	}
895
896	static void setup_temp_free(vorb f, void p, size_t sz)
897	{
898	if (f->alloc.alloc_buffer) {
899	f->temp_offset += (sz+3)&~3;
900	return;
901	}
902	free(p);
903	}
904
905	#define CRC32_POLY0x04c11db7 0x04c11db7 // from spec
906
907	static uint32 crc_table[256];
908	static void crc32_init(void)
909	{
910	int i,j;
911	uint32 s;
912	for(i=0; i < 256; i++) {
913	for (s=i<<24, j=0; j < 8; ++j)
914	s = (s << 1) ^ (s >= (1<<31) ? CRC32_POLY0x04c11db7 : 0);
915	crc_table[i] = s;
916	}
917	}
918
919	static __forceinlineinline uint32 crc32_update(uint32 crc, uint8 byte)
920	{
921	return (crc << 8) ^ crc_table[byte ^ (crc >> 24)];
922	}
923
924
// used in setup, and for huffman that doesn't go fast path
//
// Reverse the order of the low 32 bits of n (bit 0 <-> bit 31, ...) by
// swapping progressively larger groups: single bits, pairs, nibbles, bytes,
// and finally the two 16-bit halves.
static unsigned int bit_reverse(unsigned int n)
{
  n = ((n & 0xAAAAAAAA) >>  1) | ((n & 0x55555555) << 1);
  n = ((n & 0xCCCCCCCC) >>  2) | ((n & 0x33333333) << 2);
  n = ((n & 0xF0F0F0F0) >>  4) | ((n & 0x0F0F0F0F) << 4);
  n = ((n & 0xFF00FF00) >>  8) | ((n & 0x00FF00FF) << 8);
  return (n >> 16) | (n << 16);
}
934
// Return x multiplied by itself.
static float square(float x)
{
   float squared = x * x;
   return squared;
}
939
940	// this is a weird definition of log2() for which log2(1) = 1, log2(2) = 2, log2(4) = 3
941	// as required by the specification. fast(?) implementation from stb.h
942	// @OPTIMIZE: called multiple times per-packet with "constants"; move to setup
943	static int ilog(int32 n)
944	{
945	static signed char log2_4[16] = { 0,1,2,2,3,3,3,3,4,4,4,4,4,4,4,4 };
946
947	// 2 compares if n < 16, 3 compares otherwise (4 if signed or n > 1<<29)
948	if (n < (1U << 14))
949	if (n < (1U << 4)) return 0 + log2_4[n ];
950	else if (n < (1U << 9)) return 5 + log2_4[n >> 5];
951	else return 10 + log2_4[n >> 10];
952	else if (n < (1U << 24))
953	if (n < (1U << 19)) return 15 + log2_4[n >> 15];
954	else return 20 + log2_4[n >> 20];
955	else if (n < (1U << 29)) return 25 + log2_4[n >> 25];
956	else if (n < (1U << 31)) return 30 + log2_4[n >> 30];
957	else return 0; // signed n returns 0
958	}
959
#ifndef M_PI
  #define M_PI  3.14159265358979323846264f  // from CRC
#endif

// code length assigned to a value with no huffman encoding
#define NO_CODE   255
966
967	/////////////////////// LEAF SETUP FUNCTIONS //////////////////////////
968	//
969	// these functions are only called at setup, and only a few times
970	// per file
971
972	static float float32_unpack(uint32 x)
973	{
974	// from the specification
975	uint32 mantissa = x & 0x1fffff;
976	uint32 sign = x & 0x80000000;
977	uint32 exp = (x & 0x7fe00000) >> 21;
978	double res = sign ? -(double)mantissa : (double)mantissa;
979	return (float) ldexp((float)res, exp-788);
980	}
981
982
983	// zlib & jpeg huffman tables assume that the output symbols
984	// can either be arbitrarily arranged, or have monotonically
985	// increasing frequencies--they rely on the lengths being sorted;
986	// this makes for a very simple generation algorithm.
987	// vorbis allows a huffman table with non-sorted lengths. This
988	// requires a more sophisticated construction, since symbols in
989	// order do not map to huffman codes "in order".
990	static void add_entry(Codebook c, uint32 huff_code, int symbol, int count, int len, uint32 values)
991	{
992	if (!c->sparse) {
993	c->codewords [symbol] = huff_code;
994	} else {
995	c->codewords [count] = huff_code;
996	c->codeword_lengths[count] = len;
997	values [count] = symbol;
998	}
999	}
1000
1001	static int compute_codewords(Codebook c, uint8 len, int n, uint32 *values)
1002	{
1003	int i,k,m=0;
1004	uint32 available[32];
1005
1006	memset(available, 0, sizeof(available));
1007	// find the first entry
1008	for (k=0; k < n; ++k) if (len[k] < NO_CODE255) break;
1009	if (k == n) { assert(c->sorted_entries == 0)((c->sorted_entries == 0) ? (void)0 : _assert("c->sorted_entries == 0" , "src/siege/internal/stb/stb_vorbis.c", 1009)); return TRUE1; }
1010	// add to the list
1011	add_entry(c, 0, k, m++, len[k], values);
1012	// add all available leaves
1013	for (i=1; i <= len[k]; ++i)
1014	available[i] = 1 << (32-i);
1015	// note that the above code treats the first case specially,
1016	// but it's really the same as the following code, so they
1017	// could probably be combined (except the initial code is 0,
1018	// and I use 0 in available[] to mean 'empty')
1019	for (i=k+1; i < n; ++i) {
1020	uint32 res;
1021	int z = len[i], y;
1022	if (z == NO_CODE255) continue;
1023	// find lowest available leaf (should always be earliest,
1024	// which is what the specification calls for)
1025	// note that this property, and the fact we can never have
1026	// more than one free leaf at a given level, isn't totally
1027	// trivial to prove, but it seems true and the assert never
1028	// fires, so!
1029	while (z > 0 && !available[z]) --z;
1030	if (z == 0) { assert(0)((0) ? (void)0 : _assert("0", "src/siege/internal/stb/stb_vorbis.c" , 1030)); return FALSE0; }
1031	res = available[z];
1032	available[z] = 0;
1033	add_entry(c, bit_reverse(res), i, m++, len[i], values);
1034	// propogate availability up the tree
1035	if (z != len[i]) {
1036	for (y=len[i]; y > z; --y) {
1037	assert(available[y] == 0)((available[y] == 0) ? (void)0 : _assert("available[y] == 0", "src/siege/internal/stb/stb_vorbis.c", 1037));
1038	available[y] = res + (1 << (32-y));
1039	}
1040	}
1041	}
1042	return TRUE1;
1043	}
1044
1045	// accelerated huffman table allows fast O(1) match of all symbols
1046	// of length <= STB_VORBIS_FAST_HUFFMAN_LENGTH
1047	static void compute_accelerated_huffman(Codebook *c)
1048	{
1049	int i, len;
1050	for (i=0; i < FAST_HUFFMAN_TABLE_SIZE(1 << 10); ++i)
1051	c->fast_huffman[i] = -1;
1052
1053	len = c->sparse ? c->sorted_entries : c->entries;
1054	#ifdef STB_VORBIS_FAST_HUFFMAN_SHORT
1055	if (len > 32767) len = 32767; // largest possible value we can encode!
1056	#endif
1057	for (i=0; i < len; ++i) {
1058	if (c->codeword_lengths[i] <= STB_VORBIS_FAST_HUFFMAN_LENGTH10) {
1059	uint32 z = c->sparse ? bit_reverse(c->sorted_codewords[i]) : c->codewords[i];
1060	// set table entries for all bit combinations in the higher bits
1061	while (z < FAST_HUFFMAN_TABLE_SIZE(1 << 10)) {
1062	c->fast_huffman[z] = i;
1063	z += 1 << c->codeword_lengths[i];
1064	}
1065	}
1066	}
1067	}
1068
1069	static int uint32_compare(const void p, const void q)
1070	{
1071	uint32 x = * (uint32 *) p;
1072	uint32 y = * (uint32 *) q;
1073	return x < y ? -1 : x > y;
1074	}
1075
1076	static int include_in_sort(Codebook *c, uint8 len)
1077	{
1078	if (c->sparse) { assert(len != NO_CODE)((len != 255) ? (void)0 : _assert("len != NO_CODE", "src/siege/internal/stb/stb_vorbis.c" , 1078)); return TRUE1; }
1079	if (len == NO_CODE255) return FALSE0;
1080	if (len > STB_VORBIS_FAST_HUFFMAN_LENGTH10) return TRUE1;
1081	return FALSE0;
1082	}
1083
1084	// if the fast table above doesn't work, we want to binary
1085	// search them... need to reverse the bits
1086	static void compute_sorted_huffman(Codebook c, uint8 lengths, uint32 *values)
1087	{
1088	int i, len;
1089	// build a list of all the entries
1090	// OPTIMIZATION: don't include the short ones, since they'll be caught by FAST_HUFFMAN.
1091	// this is kind of a frivolous optimization--I don't see any performance improvement,
1092	// but it's like 4 extra lines of code, so.
1093	if (!c->sparse) {
1094	int k = 0;
1095	for (i=0; i < c->entries; ++i)
1096	if (include_in_sort(c, lengths[i]))
1097	c->sorted_codewords[k++] = bit_reverse(c->codewords[i]);
1098	assert(k == c->sorted_entries)((k == c->sorted_entries) ? (void)0 : _assert("k == c->sorted_entries" , "src/siege/internal/stb/stb_vorbis.c", 1098));
1099	} else {
1100	for (i=0; i < c->sorted_entries; ++i)
1101	c->sorted_codewords[i] = bit_reverse(c->codewords[i]);
1102	}
1103
1104	qsort(c->sorted_codewords, c->sorted_entries, sizeof(c->sorted_codewords[0]), uint32_compare);
1105	c->sorted_codewords[c->sorted_entries] = 0xffffffff;
1106
1107	len = c->sparse ? c->sorted_entries : c->entries;
1108	// now we need to indicate how they correspond; we could either
1109	// #1: sort a different data structure that says who they correspond to
1110	// #2: for each sorted entry, search the original list to find who corresponds
1111	// #3: for each original entry, find the sorted entry
1112	// #1 requires extra storage, #2 is slow, #3 can use binary search!
1113	for (i=0; i < len; ++i) {
1114	int huff_len = c->sparse ? lengths[values[i]] : lengths[i];
1115	if (include_in_sort(c,huff_len)) {
1116	uint32 code = bit_reverse(c->codewords[i]);
1117	int x=0, n=c->sorted_entries;
1118	while (n > 1) {
1119	// invariant: sc[x] <= code < sc[x+n]
1120	int m = x + (n >> 1);
1121	if (c->sorted_codewords[m] <= code) {
1122	x = m;
1123	n -= (n>>1);
1124	} else {
1125	n >>= 1;
1126	}
1127	}
1128	assert(c->sorted_codewords[x] == code)((c->sorted_codewords[x] == code) ? (void)0 : _assert("c->sorted_codewords[x] == code" , "src/siege/internal/stb/stb_vorbis.c", 1128));
1129	if (c->sparse) {
1130	c->sorted_values[x] = values[i];
1131	c->codeword_lengths[x] = huff_len;
1132	} else {
1133	c->sorted_values[x] = i;
1134	}
1135	}
1136	}
1137	}
1138
1139	// only run while parsing the header (3 times)
1140	static int vorbis_validate(uint8 *data)
1141	{
1142	static uint8 vorbis[6] = { 'v', 'o', 'r', 'b', 'i', 's' };
1143	return memcmp(data, vorbis, 6) == 0;
1144	}
1145
// called from setup only, once per code book
// (formula implied by specification)
//
// Returns the largest integer r such that r^dim <= entries.
// The result is found with exact integer arithmetic rather than
// exp(log(entries)/dim), whose rounding can land one off the true value and
// was previously only caught by debug-build asserts.
// Non-positive 'entries' or 'dim' yield 0.
static int lookup1_values(int entries, int dim)
{
   int r = 0;
   if (entries <= 0 || dim <= 0) return 0;
   if (dim == 1) return entries;   // r^1 <= entries  =>  r == entries
   for (;;) {
      // compute (r+1)^dim, stopping as soon as it exceeds 'entries';
      // p <= entries before each multiply, so long long cannot overflow
      long long p = 1;
      int i;
      for (i=0; i < dim && p <= entries; ++i)
         p *= (r + 1);
      if (p > entries) break;
      ++r;
   }
   return r;
}
1157
1158	// called twice per file
1159	static void compute_twiddle_factors(int n, float A, float B, float *C(2 \| 4 \| 1))
1160	{
1161	int n4 = n >> 2, n8 = n >> 3;
1162	int k,k2;
1163
1164	for (k=k2=0; k < n4; ++k,k2+=2) {
1165	A[k2 ] = (float) cos(4kM_PI3.14159265358979323846/n);
1166	A[k2+1] = (float) -sin(4kM_PI3.14159265358979323846/n);
1167	B[k2 ] = (float) cos((k2+1)M_PI3.14159265358979323846/n/2) 0.5f;
1168	B[k2+1] = (float) sin((k2+1)M_PI3.14159265358979323846/n/2) 0.5f;
1169	}
1170	for (k=k2=0; k < n8; ++k,k2+=2) {
1171	C(2 \| 4 \| 1)[k2 ] = (float) cos(2(k2+1)M_PI3.14159265358979323846/n);
1172	C(2 \| 4 \| 1)[k2+1] = (float) -sin(2(k2+1)M_PI3.14159265358979323846/n);
1173	}
1174	}
1175
1176	static void compute_window(int n, float *window)
1177	{
1178	int n2 = n >> 1, i;
1179	for (i=0; i < n2; ++i)
1180	window[i] = (float) sin(0.5 * M_PI3.14159265358979323846 * square((float) sin((i - 0 + 0.5) / n2 * 0.5 * M_PI3.14159265358979323846)));
1181	}
1182
1183	static void compute_bitreverse(int n, uint16 *rev)
1184	{
1185	int ld = ilog(n) - 1; // ilog is off-by-one from normal definitions
1186	int i, n8 = n >> 3;
1187	for (i=0; i < n8; ++i)
1188	rev[i] = (bit_reverse(i) >> (32-ld+3)) << 2;
1189	}
1190
1191	static int init_blocksize(vorb *f, int b, int n)
1192	{
1193	int n2 = n >> 1, n4 = n >> 2, n8 = n >> 3;
1194	f->A[b] = (float ) setup_malloc(f, sizeof(float) n2);
1195	f->B[b] = (float ) setup_malloc(f, sizeof(float) n2);
1196	f->C(2 \| 4 \| 1)[b] = (float ) setup_malloc(f, sizeof(float) n4);
1197	if (!f->A[b] \|\| !f->B[b] \|\| !f->C(2 \| 4 \| 1)[b]) return error(f, VORBIS_outofmem);
1198	compute_twiddle_factors(n, f->A[b], f->B[b], f->C(2 \| 4 \| 1)[b]);
1199	f->window[b] = (float ) setup_malloc(f, sizeof(float) n2);
1200	if (!f->window[b]) return error(f, VORBIS_outofmem);
1201	compute_window(n, f->window[b]);
1202	f->bit_reverse[b] = (uint16 ) setup_malloc(f, sizeof(uint16) n8);
1203	if (!f->bit_reverse[b]) return error(f, VORBIS_outofmem);
1204	compute_bitreverse(n, f->bit_reverse[b]);
1205	return TRUE1;
1206	}
1207
1208	static void neighbors(uint16 x, int n, int plow, int *phigh)
1209	{
1210	int low = -1;
1211	int high = 65536;
1212	int i;
1213	for (i=0; i < n; ++i) {
1214	if (x[i] > low && x[i] < x[n]) { *plow = i; low = x[i]; }
1215	if (x[i] < high && x[i] > x[n]) { *phigh = i; high = x[i]; }
1216	}
1217	}
1218
1219	// this has been repurposed so y is now the original index instead of y
1220	typedef struct
1221	{
1222	uint16 x,y;
1223	} Point;
1224
1225	int point_compare(const void p, const void q)
1226	{
1227	Point a = (Point ) p;
1228	Point b = (Point ) q;
1229	return a->x < b->x ? -1 : a->x > b->x;
1230	}
1231
1232	//
1233	/////////////////////// END LEAF SETUP FUNCTIONS //////////////////////////
1234
1235
// USE_MEMORY(z): true when decoder 'z' reads from an in-memory stream rather
// than a FILE; always true when stdio support is compiled out.
#if defined(STB_VORBIS_NO_STDIO)
   #define USE_MEMORY(z)    TRUE
#else
   #define USE_MEMORY(z)    ((z)->stream)
#endif
1241
1242	static uint8 get8(vorb *z)
1243	{
1244	if (USE_MEMORY(z)((z)->stream)) {
1245	if (z->stream >= z->stream_end) { z->eof = TRUE1; return 0; }
1246	return *z->stream++;
1247	}
1248
1249	#ifndef STB_VORBIS_NO_STDIO
1250	{
1251	int c = fgetc(z->f);
1252	if (c == EOF(-1)) { z->eof = TRUE1; return 0; }
1253	return c;
1254	}
1255	#endif
1256	}
1257
1258	static uint32 get32(vorb *f)
1259	{
1260	uint32 x;
1261	x = get8(f);
1262	x += get8(f) << 8;
1263	x += get8(f) << 16;
1264	x += get8(f) << 24;
1265	return x;
1266	}
1267
1268	static int getn(vorb z, uint8 data, int n)
1269	{
1270	if (USE_MEMORY(z)((z)->stream)) {
1271	if (z->stream+n > z->stream_end) { z->eof = 1; return 0; }
1272	memcpy(data, z->stream, n);
1273	z->stream += n;
1274	return 1;
1275	}
1276
1277	#ifndef STB_VORBIS_NO_STDIO
1278	if (fread(data, n, 1, z->f) == 1)
1279	return 1;
1280	else {
1281	z->eof = 1;
1282	return 0;
1283	}
1284	#endif
1285	}
1286
1287	static void skip(vorb *z, int n)
1288	{
1289	if (USE_MEMORY(z)((z)->stream)) {
1290	z->stream += n;
1291	if (z->stream >= z->stream_end) z->eof = 1;
1292	return;
1293	}
1294	#ifndef STB_VORBIS_NO_STDIO
1295	{
1296	long x = ftell(z->f);
1297	fseek(z->f, x+n, SEEK_SET0);
1298	}
1299	#endif
1300	}
1301
1302	static int set_file_offset(stb_vorbis *f, unsigned int loc)
1303	{
1304	#ifndef STB_VORBIS_NO_PUSHDATA_API
1305	if (f->push_mode) return 0;
1306	#endif
1307	f->eof = 0;
1308	if (USE_MEMORY(f)((f)->stream)) {
1309	if (f->stream_start + loc >= f->stream_end \|\| f->stream_start + loc < f->stream_start) {
1310	f->stream = f->stream_end;
1311	f->eof = 1;
1312	return 0;
1313	} else {
1314	f->stream = f->stream_start + loc;
1315	return 1;
1316	}
1317	}
1318	#ifndef STB_VORBIS_NO_STDIO
1319	if (loc + f->f_start < loc \|\| loc >= 0x80000000) {
1320	loc = 0x7fffffff;
1321	f->eof = 1;
1322	} else {
1323	loc += f->f_start;
1324	}
1325	if (!fseek(f->f, loc, SEEK_SET0))
1326	return 1;
1327	f->eof = 1;
1328	fseek(f->f, f->f_start, SEEK_END2);
1329	return 0;
1330	#endif
1331	}
1332
1333
1334	static uint8 ogg_page_header[4] = { 0x4f, 0x67, 0x67, 0x53 };
1335
1336	static int capture_pattern(vorb *f)
1337	{
1338	if (0x4f != get8(f)) return FALSE0;
1339	if (0x67 != get8(f)) return FALSE0;
1340	if (0x67 != get8(f)) return FALSE0;
1341	if (0x53 != get8(f)) return FALSE0;
1342	return TRUE1;
1343	}
1344
// bit flags in the Ogg page header flag byte (stored in page_flag)
#define PAGEFLAG_continued_packet   1
#define PAGEFLAG_first_page         2
#define PAGEFLAG_last_page          4
1348
1349	static int start_page_no_capturepattern(vorb *f)
1350	{
1351	uint32 loc0,loc1,n;
1352	int32 i;
1353	// stream structure version
1354	if (0 != get8(f)) return error(f, VORBIS_invalid_stream_structure_version);
1355	// header flag
1356	f->page_flag = get8(f);
1357	// absolute granule position
1358	loc0 = get32(f);
1359	loc1 = get32(f);
1360	// @TODO: validate loc0,loc1 as valid positions?
1361	// stream serial number -- vorbis doesn't interleave, so discard
1362	get32(f);
1363	//if (f->serial != get32(f)) return error(f, VORBIS_incorrect_stream_serial_number);
1364	// page sequence number
1365	n = get32(f);
1366	f->last_page = n;
1367	// CRC32
1368	get32(f);
1369	// page_segments
1370	f->segment_count = get8(f);
1371	if (!getn(f, f->segments, f->segment_count))
1372	return error(f, VORBIS_unexpected_eof);
1373	// assume we _don't_ know any the sample position of any segments
1374	f->end_seg_with_known_loc = -2;
1375	if (loc0 != ~0 \|\| loc1 != ~0) {
1376	// determine which packet is the last one that will complete
1377	for (i=f->segment_count-1; i >= 0; --i)
1378	if (f->segments[i] < 255)
1379	break;
1380	// 'i' is now the index of the _last_ segment of a packet that ends
1381	if (i >= 0) {
1382	f->end_seg_with_known_loc = i;
1383	f->known_loc_for_packet = loc0;
1384	}
1385	}
1386	if (f->first_decode) {
1387	int i,len;
1388	ProbedPage p;
1389	len = 0;
1390	for (i=0; i < f->segment_count; ++i)
1391	len += f->segments[i];
1392	len += 27 + f->segment_count;
1393	p.page_start = f->first_audio_page_offset;
1394	p.page_end = p.page_start + len;
1395	p.after_previous_page_start = p.page_start;
1396	p.first_decoded_sample = 0;
1397	p.last_decoded_sample = loc0;
1398	f->p_first = p;
1399	}
1400	f->next_seg = 0;
1401	return TRUE1;
1402	}
1403
1404	static int start_page(vorb *f)
1405	{
1406	if (!capture_pattern(f)) return error(f, VORBIS_missing_capture_pattern);
1407	return start_page_no_capturepattern(f);
1408	}
1409
1410	static int start_packet(vorb *f)
1411	{
1412	while (f->next_seg == -1) {
1413	if (!start_page(f)) return FALSE0;
1414	if (f->page_flag & PAGEFLAG_continued_packet1)
1415	return error(f, VORBIS_continued_packet_flag_invalid);
1416	}
1417	f->last_seg = FALSE0;
1418	f->valid_bits = 0;
1419	f->packet_bytes = 0;
1420	f->bytes_in_seg = 0;
1421	// f->next_seg is now valid
1422	return TRUE1;
1423	}
1424
1425	static int maybe_start_packet(vorb *f)
1426	{
1427	if (f->next_seg == -1) {
1428	int x = get8(f);
1429	if (f->eof) return FALSE0; // EOF at page boundary is not an error!
1430	if (0x4f != x ) return error(f, VORBIS_missing_capture_pattern);
1431	if (0x67 != get8(f)) return error(f, VORBIS_missing_capture_pattern);
1432	if (0x67 != get8(f)) return error(f, VORBIS_missing_capture_pattern);
1433	if (0x53 != get8(f)) return error(f, VORBIS_missing_capture_pattern);
1434	if (!start_page_no_capturepattern(f)) return FALSE0;
1435	if (f->page_flag & PAGEFLAG_continued_packet1) {
1436	// set up enough state that we can read this packet if we want,
1437	// e.g. during recovery
1438	f->last_seg = FALSE0;
1439	f->bytes_in_seg = 0;
1440	return error(f, VORBIS_continued_packet_flag_invalid);
1441	}
1442	}
1443	return start_packet(f);
1444	}
1445
1446	static int next_segment(vorb *f)
1447	{
1448	int len;
1449	if (f->last_seg) return 0;
1450	if (f->next_seg == -1) {
1451	f->last_seg_which = f->segment_count-1; // in case start_page fails
1452	if (!start_page(f)) { f->last_seg = 1; return 0; }
1453	if (!(f->page_flag & PAGEFLAG_continued_packet1)) return error(f, VORBIS_continued_packet_flag_invalid);
1454	}
1455	len = f->segments[f->next_seg++];
1456	if (len < 255) {
1457	f->last_seg = TRUE1;
1458	f->last_seg_which = f->next_seg-1;
1459	}
1460	if (f->next_seg >= f->segment_count)
1461	f->next_seg = -1;
1462	assert(f->bytes_in_seg == 0)((f->bytes_in_seg == 0) ? (void)0 : _assert("f->bytes_in_seg == 0" , "src/siege/internal/stb/stb_vorbis.c", 1462));
1463	f->bytes_in_seg = len;
1464	return len;
1465	}
1466
// EOP: value returned by the packet byte readers at end of packet.
// INVALID_BITS: stored in valid_bits once a bit read has run past the end.
#define EOP    (-1)
#define INVALID_BITS  (-1)
1469
1470	static int get8_packet_raw(vorb *f)
1471	{
1472	if (!f->bytes_in_seg)
1473	{
1474	if (f->last_seg) return EOP(-1);
1475	else if (!next_segment(f)) return EOP(-1);
1476	}
1477	assert(f->bytes_in_seg > 0)((f->bytes_in_seg > 0) ? (void)0 : _assert("f->bytes_in_seg > 0" , "src/siege/internal/stb/stb_vorbis.c", 1477));
1478	--f->bytes_in_seg;
1479	++f->packet_bytes;
1480	return get8(f);
1481	}
1482
1483	static int get8_packet(vorb *f)
1484	{
1485	int x = get8_packet_raw(f);
1486	f->valid_bits = 0;
1487	return x;
1488	}
1489
1490	static void flush_packet(vorb *f)
1491	{
1492	while (get8_packet_raw(f) != EOP(-1));
1493	}
1494
1495	// @OPTIMIZE: this is the secondary bit decoder, so it's probably not as important
1496	// as the huffman decoder?
1497	static uint32 get_bits(vorb *f, int n)
1498	{
1499	uint32 z;
1500
1501	if (f->valid_bits < 0) return 0;
1502	if (f->valid_bits < n) {
1503	if (n > 24) {
1504	// the accumulator technique below would not work correctly in this case
1505	z = get_bits(f, 24);
1506	z += get_bits(f, n-24) << 24;
1507	return z;
1508	}
1509	if (f->valid_bits == 0) f->acc = 0;
1510	while (f->valid_bits < n) {
1511	int z = get8_packet_raw(f);
1512	if (z == EOP(-1)) {
1513	f->valid_bits = INVALID_BITS(-1);
1514	return 0;
1515	}
1516	f->acc += z << f->valid_bits;
1517	f->valid_bits += 8;
1518	}
1519	}
1520	if (f->valid_bits < 0) return 0;
1521	z = f->acc & ((1 << n)-1);
1522	f->acc >>= n;
1523	f->valid_bits -= n;
1524	return z;
1525	}
1526
1527	static int32 get_bits_signed(vorb *f, int n)
1528	{
1529	uint32 z = get_bits(f, n);
1530	if (z & (1 << (n-1)))
1531	z += ~((1 << n) - 1);
1532	return (int32) z;
1533	}
1534
1535	// @OPTIMIZE: primary accumulator for huffman
1536	// expand the buffer to as many bits as possible without reading off end of packet
1537	// it might be nice to allow f->valid_bits and f->acc to be stored in registers,
1538	// e.g. cache them locally and decode locally
1539	static __forceinlineinline void prep_huffman(vorb *f)
1540	{
1541	if (f->valid_bits <= 24) {
1542	if (f->valid_bits == 0) f->acc = 0;
1543	do {
1544	int z;
1545	if (f->last_seg && !f->bytes_in_seg) return;
1546	z = get8_packet_raw(f);
1547	if (z == EOP(-1)) return;
1548	f->acc += z << f->valid_bits;
1549	f->valid_bits += 8;
1550	} while (f->valid_bits <= 24);
1551	}
1552	}
1553
// packet-type codes for the three Vorbis header packets
enum
{
   VORBIS_packet_id      = 1,
   VORBIS_packet_comment = 3,
   VORBIS_packet_setup   = 5
};
1560
1561	static int codebook_decode_scalar_raw(vorb f, Codebook c)
1562	{
1563	int i;
1564	prep_huffman(f);
1565
1566	assert(c->sorted_codewords \|\| c->codewords)((c->sorted_codewords \|\| c->codewords) ? (void)0 : _assert ("c->sorted_codewords \|\| c->codewords", "src/siege/internal/stb/stb_vorbis.c" , 1566));
1567	// cases to use binary search: sorted_codewords && !c->codewords
1568	// sorted_codewords && c->entries > 8
1569	if (c->entries > 8 ? c->sorted_codewords!=NULL((void*)0) : !c->codewords) {
1570	// binary search
1571	uint32 code = bit_reverse(f->acc);
1572	int x=0, n=c->sorted_entries, len;
1573
1574	while (n > 1) {
1575	// invariant: sc[x] <= code < sc[x+n]
1576	int m = x + (n >> 1);
1577	if (c->sorted_codewords[m] <= code) {
1578	x = m;
1579	n -= (n>>1);
1580	} else {
1581	n >>= 1;
1582	}
1583	}
1584	// x is now the sorted index
1585	if (!c->sparse) x = c->sorted_values[x];
1586	// x is now sorted index if sparse, or symbol otherwise
1587	len = c->codeword_lengths[x];
1588	if (f->valid_bits >= len) {
1589	f->acc >>= len;
1590	f->valid_bits -= len;
1591	return x;
1592	}
1593
1594	f->valid_bits = 0;
1595	return -1;
1596	}
1597
1598	// if small, linear search
1599	assert(!c->sparse)((!c->sparse) ? (void)0 : _assert("!c->sparse", "src/siege/internal/stb/stb_vorbis.c" , 1599));
1600	for (i=0; i < c->entries; ++i) {
1601	if (c->codeword_lengths[i] == NO_CODE255) continue;
1602	if (c->codewords[i] == (f->acc & ((1 << c->codeword_lengths[i])-1))) {
1603	if (f->valid_bits >= c->codeword_lengths[i]) {
1604	f->acc >>= c->codeword_lengths[i];
1605	f->valid_bits -= c->codeword_lengths[i];
1606	return i;
1607	}
1608	f->valid_bits = 0;
1609	return -1;
1610	}
1611	}
1612
1613	error(f, VORBIS_invalid_stream);
1614	f->valid_bits = 0;
1615	return -1;
1616	}
1617
1618	static int codebook_decode_scalar(vorb f, Codebook c)
1619	{
1620	int i;
1621	if (f->valid_bits < STB_VORBIS_FAST_HUFFMAN_LENGTH10)
1622	prep_huffman(f);
1623	// fast huffman table lookup
1624	i = f->acc & FAST_HUFFMAN_TABLE_MASK((1 << 10) - 1);
1625	i = c->fast_huffman[i];
1626	if (i >= 0) {
1627	f->acc >>= c->codeword_lengths[i];
1628	f->valid_bits -= c->codeword_lengths[i];
1629	if (f->valid_bits < 0) { f->valid_bits = 0; return -1; }
1630	return i;
1631	}
1632	return codebook_decode_scalar_raw(f,c);
1633	}
1634
// DECODE_RAW(var,f,c): decode one huffman symbol from codebook c into var
// (-1 on failure). By default the fast-table lookup is expanded inline; with
// STB_VORBIS_NO_INLINE_DECODE it calls codebook_decode_scalar() instead.
// These macros expand to several statements, so use them only as a statement
// inside braces.
#ifndef STB_VORBIS_NO_INLINE_DECODE

#define DECODE_RAW(var, f,c)                                  \
   if (f->valid_bits < STB_VORBIS_FAST_HUFFMAN_LENGTH)        \
      prep_huffman(f);                                        \
   var = f->acc & FAST_HUFFMAN_TABLE_MASK;                    \
   var = c->fast_huffman[var];                                \
   if (var >= 0) {                                            \
      int n = c->codeword_lengths[var];                       \
      f->acc >>= n;                                           \
      f->valid_bits -= n;                                     \
      if (f->valid_bits < 0) { f->valid_bits = 0; var = -1; } \
   } else {                                                   \
      var = codebook_decode_scalar_raw(f,c);                  \
   }

#else

#define DECODE_RAW(var,f,c)    var = codebook_decode_scalar(f,c);

#endif

// DECODE: like DECODE_RAW, then maps the result through sorted_values[]
// for sparse codebooks.
#define DECODE(var,f,c)                                       \
   DECODE_RAW(var,f,c)                                        \
   if (c->sparse) var = c->sorted_values[var];

// DECODE_VQ: the variant used for vector decoding
#ifndef STB_VORBIS_DIVIDES_IN_CODEBOOK
  #define DECODE_VQ(var,f,c)   DECODE_RAW(var,f,c)
#else
  #define DECODE_VQ(var,f,c)   DECODE(var,f,c)
#endif
1666
1667
1668
1669
1670
1671
// CODEBOOK_ELEMENT_FAST is an optimization for the CODEBOOK_FLOATS case
// where we avoid one addition
#ifndef STB_VORBIS_CODEBOOK_FLOATS
   #define CODEBOOK_ELEMENT(c,off)          (c->multiplicands[off] * c->delta_value + c->minimum_value)
   #define CODEBOOK_ELEMENT_FAST(c,off)     (c->multiplicands[off] * c->delta_value)
   #define CODEBOOK_ELEMENT_BASE(c)         (c->minimum_value)
#else
   #define CODEBOOK_ELEMENT(c,off)          (c->multiplicands[off])
   #define CODEBOOK_ELEMENT_FAST(c,off)     (c->multiplicands[off])
   #define CODEBOOK_ELEMENT_BASE(c)         (0)
#endif
1683
1684	static int codebook_decode_start(vorb f, Codebook c, int len)
1685	{
1686	int z = -1;
1687
1688	// type 0 is only legal in a scalar context
1689	if (c->lookup_type == 0)
1690	error(f, VORBIS_invalid_stream);
1691	else {
1692	DECODE_VQ(z,f,c)if (f->valid_bits < 10) prep_huffman(f); z = f->acc & ((1 << 10) - 1); z = c->fast_huffman[z]; if (z >= 0) { int n = c->codeword_lengths[z]; f->acc >>= n ; f->valid_bits -= n; if (f->valid_bits < 0) { f-> valid_bits = 0; z = -1; } } else { z = codebook_decode_scalar_raw (f,c); };
1693	if (c->sparse) assert(z < c->sorted_entries)((z < c->sorted_entries) ? (void)0 : _assert("z < c->sorted_entries" , "src/siege/internal/stb/stb_vorbis.c", 1693));
1694	if (z < 0) { // check for EOP
1695	if (!f->bytes_in_seg)
1696	if (f->last_seg)
1697	return z;
1698	error(f, VORBIS_invalid_stream);
1699	}
1700	}
1701	return z;
1702	}
1703
1704	static int codebook_decode(vorb f, Codebook c, float *output, int len)
1705	{
1706	int i,z = codebook_decode_start(f,c,len);
1707	if (z < 0) return FALSE0;
1708	if (len > c->dimensions) len = c->dimensions;
1709
1710	#ifdef STB_VORBIS_DIVIDES_IN_CODEBOOK
1711	if (c->lookup_type == 1) {
1712	float last = CODEBOOK_ELEMENT_BASE(c)(0);
1713	int div = 1;
1714	for (i=0; i < len; ++i) {
1715	int off = (z / div) % c->lookup_values;
1716	float val = CODEBOOK_ELEMENT_FAST(c,off)(c->multiplicands[off]) + last;
1717	output[i] += val;
1718	if (c->sequence_p) last = val + c->minimum_value;
1719	div *= c->lookup_values;
1720	}
1721	return TRUE1;
1722	}
1723	#endif
1724
1725	z *= c->dimensions;
1726	if (c->sequence_p) {
1727	float last = CODEBOOK_ELEMENT_BASE(c)(0);
1728	for (i=0; i < len; ++i) {
1729	float val = CODEBOOK_ELEMENT_FAST(c,z+i)(c->multiplicands[z+i]) + last;
1730	output[i] += val;
1731	last = val + c->minimum_value;
1732	}
1733	} else {
1734	float last = CODEBOOK_ELEMENT_BASE(c)(0);
1735	for (i=0; i < len; ++i) {
1736	output[i] += CODEBOOK_ELEMENT_FAST(c,z+i)(c->multiplicands[z+i]) + last;
1737	}
1738	}
1739
1740	return TRUE1;
1741	}
1742
1743	static int codebook_decode_step(vorb f, Codebook c, float *output, int len, int step)
1744	{
1745	int i,z = codebook_decode_start(f,c,len);
1746	float last = CODEBOOK_ELEMENT_BASE(c)(0);
1747	if (z < 0) return FALSE0;
1748	if (len > c->dimensions) len = c->dimensions;
1749
1750	#ifdef STB_VORBIS_DIVIDES_IN_CODEBOOK
1751	if (c->lookup_type == 1) {
1752	int div = 1;
1753	for (i=0; i < len; ++i) {
1754	int off = (z / div) % c->lookup_values;
1755	float val = CODEBOOK_ELEMENT_FAST(c,off)(c->multiplicands[off]) + last;
1756	output[i*step] += val;
1757	if (c->sequence_p) last = val;
1758	div *= c->lookup_values;
1759	}
1760	return TRUE1;
1761	}
1762	#endif
1763
1764	z *= c->dimensions;
1765	for (i=0; i < len; ++i) {
1766	float val = CODEBOOK_ELEMENT_FAST(c,z+i)(c->multiplicands[z+i]) + last;
1767	output[i*step] += val;
1768	if (c->sequence_p) last = val;
1769	}
1770
1771	return TRUE1;
1772	}
1773
1774	static int codebook_decode_deinterleave_repeat(vorb f, Codebook c, float *outputs, int ch, int c_inter_p, int *p_inter_p, int len, int total_decode)
1775	{
1776	int c_inter = *c_inter_p;
1777	int p_inter = *p_inter_p;
1778	int i,z, effective = c->dimensions;
1779
1780	// type 0 is only legal in a scalar context
1781	if (c->lookup_type == 0) return error(f, VORBIS_invalid_stream);
1782
1783	while (total_decode > 0) {
1784	float last = CODEBOOK_ELEMENT_BASE(c)(0);
1785	DECODE_VQ(z,f,c)if (f->valid_bits < 10) prep_huffman(f); z = f->acc & ((1 << 10) - 1); z = c->fast_huffman[z]; if (z >= 0) { int n = c->codeword_lengths[z]; f->acc >>= n ; f->valid_bits -= n; if (f->valid_bits < 0) { f-> valid_bits = 0; z = -1; } } else { z = codebook_decode_scalar_raw (f,c); };
1786	#ifndef STB_VORBIS_DIVIDES_IN_CODEBOOK
1787	assert(!c->sparse \|\| z < c->sorted_entries)((!c->sparse \|\| z < c->sorted_entries) ? (void)0 : _assert ("!c->sparse \|\| z < c->sorted_entries", "src/siege/internal/stb/stb_vorbis.c" , 1787));
1788	#endif
1789	if (z < 0) {
1790	if (!f->bytes_in_seg)
1791	if (f->last_seg) return FALSE0;
1792	return error(f, VORBIS_invalid_stream);
1793	}
1794
1795	// if this will take us off the end of the buffers, stop short!
1796	// we check by computing the length of the virtual interleaved
1797	// buffer (lench), our current offset within it (p_interch)+(c_inter),
1798	// and the length we'll be using (effective)
1799	if (c_inter + p_interch + effective > len ch) {
1800	effective = lench - (p_interch - c_inter);
1801	}
1802
1803	#ifdef STB_VORBIS_DIVIDES_IN_CODEBOOK
1804	if (c->lookup_type == 1) {
1805	int div = 1;
1806	for (i=0; i < effective; ++i) {
1807	int off = (z / div) % c->lookup_values;
1808	float val = CODEBOOK_ELEMENT_FAST(c,off)(c->multiplicands[off]) + last;
1809	outputs[c_inter][p_inter] += val;
1810	if (++c_inter == ch) { c_inter = 0; ++p_inter; }
1811	if (c->sequence_p) last = val;
1812	div *= c->lookup_values;
1813	}
1814	} else
1815	#endif
1816	{
1817	z *= c->dimensions;
1818	if (c->sequence_p) {
1819	for (i=0; i < effective; ++i) {
1820	float val = CODEBOOK_ELEMENT_FAST(c,z+i)(c->multiplicands[z+i]) + last;
1821	outputs[c_inter][p_inter] += val;
1822	if (++c_inter == ch) { c_inter = 0; ++p_inter; }
1823	last = val;
1824	}
1825	} else {
1826	for (i=0; i < effective; ++i) {
1827	float val = CODEBOOK_ELEMENT_FAST(c,z+i)(c->multiplicands[z+i]) + last;
1828	outputs[c_inter][p_inter] += val;
1829	if (++c_inter == ch) { c_inter = 0; ++p_inter; }
1830	}
1831	}
1832	}
1833
1834	total_decode -= effective;
1835	}
1836	*c_inter_p = c_inter;
1837	*p_inter_p = p_inter;
1838	return TRUE1;
1839	}
1840
1841	#ifndef STB_VORBIS_DIVIDES_IN_CODEBOOK
1842	static int codebook_decode_deinterleave_repeat_2(vorb f, Codebook c, float *outputs, int c_inter_p, int *p_inter_p, int len, int total_decode)
1843	{
1844	int c_inter = *c_inter_p;
1845	int p_inter = *p_inter_p;
1846	int i,z, effective = c->dimensions;
1847
1848	// type 0 is only legal in a scalar context
1849	if (c->lookup_type == 0) return error(f, VORBIS_invalid_stream);
1850
1851	while (total_decode > 0) {
1852	float last = CODEBOOK_ELEMENT_BASE(c)(0);
1853	DECODE_VQ(z,f,c)if (f->valid_bits < 10) prep_huffman(f); z = f->acc & ((1 << 10) - 1); z = c->fast_huffman[z]; if (z >= 0) { int n = c->codeword_lengths[z]; f->acc >>= n ; f->valid_bits -= n; if (f->valid_bits < 0) { f-> valid_bits = 0; z = -1; } } else { z = codebook_decode_scalar_raw (f,c); };
1854
1855	if (z < 0) {
1856	if (!f->bytes_in_seg)
1857	if (f->last_seg) return FALSE0;
1858	return error(f, VORBIS_invalid_stream);
1859	}
1860
1861	// if this will take us off the end of the buffers, stop short!
1862	// we check by computing the length of the virtual interleaved
1863	// buffer (lench), our current offset within it (p_interch)+(c_inter),
1864	// and the length we'll be using (effective)
1865	if (c_inter + p_inter2 + effective > len 2) {
1866	effective = len2 - (p_inter2 - c_inter);
1867	}
1868
1869	{
1870	z *= c->dimensions;
1871	stb_prof(11)(void)0;
1872	if (c->sequence_p) {
1873	// haven't optimized this case because I don't have any examples
1874	for (i=0; i < effective; ++i) {
1875	float val = CODEBOOK_ELEMENT_FAST(c,z+i)(c->multiplicands[z+i]) + last;
1876	outputs[c_inter][p_inter] += val;
1877	if (++c_inter == 2) { c_inter = 0; ++p_inter; }
1878	last = val;
1879	}
1880	} else {
1881	i=0;
1882	if (c_inter == 1) {
1883	float val = CODEBOOK_ELEMENT_FAST(c,z+i)(c->multiplicands[z+i]) + last;
1884	outputs[c_inter][p_inter] += val;
1885	c_inter = 0; ++p_inter;
1886	++i;
1887	}
1888	{
1889	float *z0 = outputs[0];
1890	float *z1 = outputs[1];
1891	for (; i+1 < effective;) {
1892	z0[p_inter] += CODEBOOK_ELEMENT_FAST(c,z+i)(c->multiplicands[z+i]) + last;
1893	z1[p_inter] += CODEBOOK_ELEMENT_FAST(c,z+i+1)(c->multiplicands[z+i+1]) + last;
1894	++p_inter;
1895	i += 2;
1896	}
1897	}
1898	if (i < effective) {
1899	float val = CODEBOOK_ELEMENT_FAST(c,z+i)(c->multiplicands[z+i]) + last;
1900	outputs[c_inter][p_inter] += val;
1901	if (++c_inter == 2) { c_inter = 0; ++p_inter; }
1902	}
1903	}
1904	}
1905
1906	total_decode -= effective;
1907	}
1908	*c_inter_p = c_inter;
1909	*p_inter_p = p_inter;
1910	return TRUE1;
1911	}
1912	#endif
1913
// Integer interpolation of the line through (x0,y0)-(x1,y1), evaluated at x.
// The offset |dy| * (x - x0) / adx is computed on the magnitude of dy and
// truncated, then applied toward y1, so rising and falling lines round the
// same way. x1 must differ from x0 (adx is used as a divisor).
static int predict_point(int x, int x0, int x1, int y0, int y1)
{
   int dy = y1 - y0;
   int adx = x1 - x0;
   // @OPTIMIZE: force int division to round in the right direction... is this necessary on x86?
   int err = abs(dy) * (x - x0);
   int off = err / adx;
   return dy < 0 ? y0 - off : y0 + off;
}
1923
1924	// the following table is block-copied from the specification
1925	static float inverse_db_table[256] =
1926	{
1927	1.0649863e-07f, 1.1341951e-07f, 1.2079015e-07f, 1.2863978e-07f,
1928	1.3699951e-07f, 1.4590251e-07f, 1.5538408e-07f, 1.6548181e-07f,
1929	1.7623575e-07f, 1.8768855e-07f, 1.9988561e-07f, 2.1287530e-07f,
1930	2.2670913e-07f, 2.4144197e-07f, 2.5713223e-07f, 2.7384213e-07f,
1931	2.9163793e-07f, 3.1059021e-07f, 3.3077411e-07f, 3.5226968e-07f,
1932	3.7516214e-07f, 3.9954229e-07f, 4.2550680e-07f, 4.5315863e-07f,
1933	4.8260743e-07f, 5.1396998e-07f, 5.4737065e-07f, 5.8294187e-07f,
1934	6.2082472e-07f, 6.6116941e-07f, 7.0413592e-07f, 7.4989464e-07f,
1935	7.9862701e-07f, 8.5052630e-07f, 9.0579828e-07f, 9.6466216e-07f,
1936	1.0273513e-06f, 1.0941144e-06f, 1.1652161e-06f, 1.2409384e-06f,
1937	1.3215816e-06f, 1.4074654e-06f, 1.4989305e-06f, 1.5963394e-06f,
1938	1.7000785e-06f, 1.8105592e-06f, 1.9282195e-06f, 2.0535261e-06f,
1939	2.1869758e-06f, 2.3290978e-06f, 2.4804557e-06f, 2.6416497e-06f,
1940	2.8133190e-06f, 2.9961443e-06f, 3.1908506e-06f, 3.3982101e-06f,
1941	3.6190449e-06f, 3.8542308e-06f, 4.1047004e-06f, 4.3714470e-06f,
1942	4.6555282e-06f, 4.9580707e-06f, 5.2802740e-06f, 5.6234160e-06f,
1943	5.9888572e-06f, 6.3780469e-06f, 6.7925283e-06f, 7.2339451e-06f,
1944	7.7040476e-06f, 8.2047000e-06f, 8.7378876e-06f, 9.3057248e-06f,
1945	9.9104632e-06f, 1.0554501e-05f, 1.1240392e-05f, 1.1970856e-05f,
1946	1.2748789e-05f, 1.3577278e-05f, 1.4459606e-05f, 1.5399272e-05f,
1947	1.6400004e-05f, 1.7465768e-05f, 1.8600792e-05f, 1.9809576e-05f,
1948	2.1096914e-05f, 2.2467911e-05f, 2.3928002e-05f, 2.5482978e-05f,
1949	2.7139006e-05f, 2.8902651e-05f, 3.0780908e-05f, 3.2781225e-05f,
1950	3.4911534e-05f, 3.7180282e-05f, 3.9596466e-05f, 4.2169667e-05f,
1951	4.4910090e-05f, 4.7828601e-05f, 5.0936773e-05f, 5.4246931e-05f,
1952	5.7772202e-05f, 6.1526565e-05f, 6.5524908e-05f, 6.9783085e-05f,
1953	7.4317983e-05f, 7.9147585e-05f, 8.4291040e-05f, 8.9768747e-05f,
1954	9.5602426e-05f, 0.00010181521f, 0.00010843174f, 0.00011547824f,
1955	0.00012298267f, 0.00013097477f, 0.00013948625f, 0.00014855085f,
1956	0.00015820453f, 0.00016848555f, 0.00017943469f, 0.00019109536f,
1957	0.00020351382f, 0.00021673929f, 0.00023082423f, 0.00024582449f,
1958	0.00026179955f, 0.00027881276f, 0.00029693158f, 0.00031622787f,
1959	0.00033677814f, 0.00035866388f, 0.00038197188f, 0.00040679456f,
1960	0.00043323036f, 0.00046138411f, 0.00049136745f, 0.00052329927f,
1961	0.00055730621f, 0.00059352311f, 0.00063209358f, 0.00067317058f,
1962	0.00071691700f, 0.00076350630f, 0.00081312324f, 0.00086596457f,
1963	0.00092223983f, 0.00098217216f, 0.0010459992f, 0.0011139742f,
1964	0.0011863665f, 0.0012634633f, 0.0013455702f, 0.0014330129f,
1965	0.0015261382f, 0.0016253153f, 0.0017309374f, 0.0018434235f,
1966	0.0019632195f, 0.0020908006f, 0.0022266726f, 0.0023713743f,
1967	0.0025254795f, 0.0026895994f, 0.0028643847f, 0.0030505286f,
1968	0.0032487691f, 0.0034598925f, 0.0036847358f, 0.0039241906f,
1969	0.0041792066f, 0.0044507950f, 0.0047400328f, 0.0050480668f,
1970	0.0053761186f, 0.0057254891f, 0.0060975636f, 0.0064938176f,
1971	0.0069158225f, 0.0073652516f, 0.0078438871f, 0.0083536271f,
1972	0.0088964928f, 0.009474637f, 0.010090352f, 0.010746080f,
1973	0.011444421f, 0.012188144f, 0.012980198f, 0.013823725f,
1974	0.014722068f, 0.015678791f, 0.016697687f, 0.017782797f,
1975	0.018938423f, 0.020169149f, 0.021479854f, 0.022875735f,
1976	0.024362330f, 0.025945531f, 0.027631618f, 0.029427276f,
1977	0.031339626f, 0.033376252f, 0.035545228f, 0.037855157f,
1978	0.040315199f, 0.042935108f, 0.045725273f, 0.048696758f,
1979	0.051861348f, 0.055231591f, 0.058820850f, 0.062643361f,
1980	0.066714279f, 0.071049749f, 0.075666962f, 0.080584227f,
1981	0.085821044f, 0.091398179f, 0.097337747f, 0.10366330f,
1982	0.11039993f, 0.11757434f, 0.12521498f, 0.13335215f,
1983	0.14201813f, 0.15124727f, 0.16107617f, 0.17154380f,
1984	0.18269168f, 0.19456402f, 0.20720788f, 0.22067342f,
1985	0.23501402f, 0.25028656f, 0.26655159f, 0.28387361f,
1986	0.30232132f, 0.32196786f, 0.34289114f, 0.36517414f,
1987	0.38890521f, 0.41417847f, 0.44109412f, 0.46975890f,
1988	0.50028648f, 0.53279791f, 0.56742212f, 0.60429640f,
1989	0.64356699f, 0.68538959f, 0.72993007f, 0.77736504f,
1990	0.82788260f, 0.88168307f, 0.9389798f, 1.0f
1991	};
1992
1993
1994	// @OPTIMIZE: if you want to replace this bresenham line-drawing routine,
1995	// note that you must produce bit-identical output to decode correctly;
1996	// this specific sequence of operations is specified in the spec (it's
1997	// drawing integer-quantized frequency-space lines that the encoder
1998	// expects to be exactly the same)
1999	// ... also, isn't the whole point of Bresenham's algorithm to NOT
2000	// have to divide in the setup? sigh.
#ifndef STB_VORBIS_NO_DEFER_FLOOR
// default: scale the value already stored in 'a' by 'b'
#define LINE_OP(a,b)   ((a) *= (b))
#else
// STB_VORBIS_NO_DEFER_FLOOR: overwrite 'a' with 'b'
#define LINE_OP(a,b)   ((a) = (b))
#endif
2006
2007	#ifdef STB_VORBIS_DIVIDE_TABLE
2008	#define DIVTAB_NUMER 32
2009	#define DIVTAB_DENOM 64
2010	int8 integer_divide_table[DIVTAB_NUMER][DIVTAB_DENOM]; // 2KB
2011	#endif
2012
2013	static __forceinlineinline void draw_line(float *output, int x0, int y0, int x1, int y1, int n)
2014	{
2015	int dy = y1 - y0;
2016	int adx = x1 - x0;
2017	int ady = abs(dy);
2018	int base;
2019	int x=x0,y=y0;
2020	int err = 0;
2021	int sy;
2022
2023	#ifdef STB_VORBIS_DIVIDE_TABLE
2024	if (adx < DIVTAB_DENOM && ady < DIVTAB_NUMER) {
2025	if (dy < 0) {
2026	base = -integer_divide_table[ady][adx];
2027	sy = base-1;
2028	} else {
2029	base = integer_divide_table[ady][adx];
2030	sy = base+1;
2031	}
2032	} else {
2033	base = dy / adx;
2034	if (dy < 0)
2035	sy = base - 1;
2036	else
2037	sy = base+1;
2038	}
2039	#else
2040	base = dy / adx;
2041	if (dy < 0)
2042	sy = base - 1;
2043	else
2044	sy = base+1;
2045	#endif
2046	ady -= abs(base) * adx;
2047	if (x1 > n) x1 = n;
2048	LINE_OP(output[x], inverse_db_table[y])output[x] *= inverse_db_table[y];
2049	for (++x; x < x1; ++x) {
2050	err += ady;
2051	if (err >= adx) {
2052	err -= adx;
2053	y += sy;
2054	} else
2055	y += base;
2056	LINE_OP(output[x], inverse_db_table[y])output[x] *= inverse_db_table[y];
2057	}
2058	}
2059
2060	static int residue_decode(vorb f, Codebook book, float *target, int offset, int n, int rtype)
2061	{
2062	int k;
2063	if (rtype == 0) {
2064	int step = n / book->dimensions;
2065	for (k=0; k < step; ++k)
2066	if (!codebook_decode_step(f, book, target+offset+k, n-offset-k, step))
2067	return FALSE0;
2068	} else {
2069	for (k=0; k < n; ) {
2070	if (!codebook_decode(f, book, target+offset, n-k))
2071	return FALSE0;
2072	k += book->dimensions;
2073	offset += book->dimensions;
2074	}
2075	}
2076	return TRUE1;
2077	}
2078
2079	static void decode_residue(vorb f, float residue_buffers[], int ch, int n, int rn, uint8 *do_not_decode)
2080	{
2081	int i,j,pass;
2082	Residue *r = f->residue_config + rn;
2083	int rtype = f->residue_types[rn];
2084	int c = r->classbook;
2085	int classwords = f->codebooks[c].dimensions;
2086	int n_read = r->end - r->begin;
2087	int part_read = n_read / r->part_size;
2088	int temp_alloc_point = temp_alloc_save(f)((f)->temp_offset);
2089	#ifndef STB_VORBIS_DIVIDES_IN_RESIDUE
2090	uint8 *part_classdata = (uint8 ) temp_block_array(f,f->channels, part_read sizeof(*part_classdata))make_block_array((f->alloc.alloc_buffer ? setup_temp_malloc (f,(f->channels(sizeof(void )+(part_read sizeof(*part_classdata ))))) : alloca((f->channels(sizeof(void )+(part_read sizeof (*part_classdata)))))), f->channels, part_read sizeof(* *part_classdata));
2091	#else
2092	int classifications = (int ) temp_block_array(f,f->channels, part_read * sizeof(*classifications))make_block_array((f->alloc.alloc_buffer ? setup_temp_malloc (f,(f->channels(sizeof(void )+(part_read sizeof(*classifications ))))) : alloca((f->channels(sizeof(void )+(part_read sizeof (*classifications)))))), f->channels, part_read sizeof( **classifications));
2093	#endif
2094
2095	stb_prof(2)(void)0;
2096	for (i=0; i < ch; ++i)
2097	if (!do_not_decode[i])
2098	memset(residue_buffers[i], 0, sizeof(float) * n);
2099
2100	if (rtype == 2 && ch != 1) {
2101	int len = ch * n;
2102	(void)len;
2103	for (j=0; j < ch; ++j)
2104	if (!do_not_decode[j])
2105	break;
2106	if (j == ch)
2107	goto done;
2108
2109	stb_prof(3)(void)0;
2110	for (pass=0; pass < 8; ++pass) {
2111	int pcount = 0, class_set = 0;
2112	if (ch == 2) {
2113	stb_prof(13)(void)0;
2114	while (pcount < part_read) {
2115	int z = r->begin + pcount*r->part_size;
2116	int c_inter = (z & 1), p_inter = z>>1;
2117	if (pass == 0) {
2118	Codebook *c = f->codebooks+r->classbook;
2119	int q;
2120	DECODE(q,f,c)if (f->valid_bits < 10) prep_huffman(f); q = f->acc & ((1 << 10) - 1); q = c->fast_huffman[q]; if (q >= 0) { int n = c->codeword_lengths[q]; f->acc >>= n ; f->valid_bits -= n; if (f->valid_bits < 0) { f-> valid_bits = 0; q = -1; } } else { q = codebook_decode_scalar_raw (f,c); } if (c->sparse) q = c->sorted_values[q];;
2121	if (q == EOP(-1)) goto done;
2122	#ifndef STB_VORBIS_DIVIDES_IN_RESIDUE
2123	part_classdata[0][class_set] = r->classdata[q];
2124	#else
2125	for (i=classwords-1; i >= 0; --i) {
2126	classifications[0][i+pcount] = q % r->classifications;
2127	q /= r->classifications;
2128	}
2129	#endif
2130	}
2131	stb_prof(5)(void)0;
2132	for (i=0; i < classwords && pcount < part_read; ++i, ++pcount) {
2133	int z = r->begin + pcount*r->part_size;
2134	#ifndef STB_VORBIS_DIVIDES_IN_RESIDUE
2135	int c = part_classdata[0][class_set][i];
2136	#else
2137	int c = classifications[0][pcount];
2138	#endif
2139	int b = r->residue_books[c][pass];
2140	if (b >= 0) {
2141	Codebook *book = f->codebooks + b;
2142	stb_prof(20)(void)0; // accounts for X time
2143	#ifdef STB_VORBIS_DIVIDES_IN_CODEBOOK
2144	if (!codebook_decode_deinterleave_repeat(f, book, residue_buffers, ch, &c_inter, &p_inter, n, r->part_size))
2145	goto done;
2146	#else
2147	// saves 1%
2148	if (!codebook_decode_deinterleave_repeat_2(f, book, residue_buffers, &c_inter, &p_inter, n, r->part_size))
2149	goto done;
2150	#endif
2151	stb_prof(7)(void)0;
2152	} else {
2153	z += r->part_size;
2154	c_inter = z & 1;
2155	p_inter = z >> 1;
2156	}
2157	}
2158	stb_prof(8)(void)0;
2159	#ifndef STB_VORBIS_DIVIDES_IN_RESIDUE
2160	++class_set;
2161	#endif
2162	}
2163	} else if (ch == 1) {
2164	while (pcount < part_read) {
2165	int z = r->begin + pcount*r->part_size;
2166	int c_inter = 0, p_inter = z;
2167	if (pass == 0) {
2168	Codebook *c = f->codebooks+r->classbook;
2169	int q;
2170	DECODE(q,f,c)if (f->valid_bits < 10) prep_huffman(f); q = f->acc & ((1 << 10) - 1); q = c->fast_huffman[q]; if (q >= 0) { int n = c->codeword_lengths[q]; f->acc >>= n ; f->valid_bits -= n; if (f->valid_bits < 0) { f-> valid_bits = 0; q = -1; } } else { q = codebook_decode_scalar_raw (f,c); } if (c->sparse) q = c->sorted_values[q];;
2171	if (q == EOP(-1)) goto done;
2172	#ifndef STB_VORBIS_DIVIDES_IN_RESIDUE
2173	part_classdata[0][class_set] = r->classdata[q];
2174	#else
2175	for (i=classwords-1; i >= 0; --i) {
2176	classifications[0][i+pcount] = q % r->classifications;
2177	q /= r->classifications;
2178	}
2179	#endif
2180	}
2181	for (i=0; i < classwords && pcount < part_read; ++i, ++pcount) {
2182	int z = r->begin + pcount*r->part_size;
2183	#ifndef STB_VORBIS_DIVIDES_IN_RESIDUE
2184	int c = part_classdata[0][class_set][i];
2185	#else
2186	int c = classifications[0][pcount];
2187	#endif
2188	int b = r->residue_books[c][pass];
2189	if (b >= 0) {
2190	Codebook *book = f->codebooks + b;
2191	stb_prof(22)(void)0;
2192	if (!codebook_decode_deinterleave_repeat(f, book, residue_buffers, ch, &c_inter, &p_inter, n, r->part_size))
2193	goto done;
2194	stb_prof(3)(void)0;
2195	} else {
2196	z += r->part_size;
2197	c_inter = 0;
2198	p_inter = z;
2199	}
2200	}
2201	#ifndef STB_VORBIS_DIVIDES_IN_RESIDUE
2202	++class_set;
2203	#endif
2204	}
2205	} else {
2206	while (pcount < part_read) {
2207	int z = r->begin + pcount*r->part_size;
2208	int c_inter = z % ch, p_inter = z/ch;
2209	if (pass == 0) {
2210	Codebook *c = f->codebooks+r->classbook;
2211	int q;
2212	DECODE(q,f,c)if (f->valid_bits < 10) prep_huffman(f); q = f->acc & ((1 << 10) - 1); q = c->fast_huffman[q]; if (q >= 0) { int n = c->codeword_lengths[q]; f->acc >>= n ; f->valid_bits -= n; if (f->valid_bits < 0) { f-> valid_bits = 0; q = -1; } } else { q = codebook_decode_scalar_raw (f,c); } if (c->sparse) q = c->sorted_values[q];;
2213	if (q == EOP(-1)) goto done;
2214	#ifndef STB_VORBIS_DIVIDES_IN_RESIDUE
2215	part_classdata[0][class_set] = r->classdata[q];
2216	#else
2217	for (i=classwords-1; i >= 0; --i) {
2218	classifications[0][i+pcount] = q % r->classifications;
2219	q /= r->classifications;
2220	}
2221	#endif
2222	}
2223	for (i=0; i < classwords && pcount < part_read; ++i, ++pcount) {
2224	int z = r->begin + pcount*r->part_size;
2225	#ifndef STB_VORBIS_DIVIDES_IN_RESIDUE
2226	int c = part_classdata[0][class_set][i];
2227	#else
2228	int c = classifications[0][pcount];
2229	#endif
2230	int b = r->residue_books[c][pass];
2231	if (b >= 0) {
2232	Codebook *book = f->codebooks + b;
2233	stb_prof(22)(void)0;
2234	if (!codebook_decode_deinterleave_repeat(f, book, residue_buffers, ch, &c_inter, &p_inter, n, r->part_size))
2235	goto done;
2236	stb_prof(3)(void)0;
2237	} else {
2238	z += r->part_size;
2239	c_inter = z % ch;
2240	p_inter = z / ch;
2241	}
2242	}
2243	#ifndef STB_VORBIS_DIVIDES_IN_RESIDUE
2244	++class_set;
2245	#endif
2246	}
2247	}
2248	}
2249	goto done;
2250	}
2251	stb_prof(9)(void)0;
2252
2253	for (pass=0; pass < 8; ++pass) {
2254	int pcount = 0, class_set=0;
2255	while (pcount < part_read) {
2256	if (pass == 0) {
2257	for (j=0; j < ch; ++j) {
2258	if (!do_not_decode[j]) {
2259	Codebook *c = f->codebooks+r->classbook;
2260	int temp;
2261	DECODE(temp,f,c)if (f->valid_bits < 10) prep_huffman(f); temp = f->acc & ((1 << 10) - 1); temp = c->fast_huffman[temp] ; if (temp >= 0) { int n = c->codeword_lengths[temp]; f ->acc >>= n; f->valid_bits -= n; if (f->valid_bits < 0) { f->valid_bits = 0; temp = -1; } } else { temp = codebook_decode_scalar_raw(f,c); } if (c->sparse) temp = c ->sorted_values[temp];;
2262	if (temp == EOP(-1)) goto done;
2263	#ifndef STB_VORBIS_DIVIDES_IN_RESIDUE
2264	part_classdata[j][class_set] = r->classdata[temp];
2265	#else
2266	for (i=classwords-1; i >= 0; --i) {
2267	classifications[j][i+pcount] = temp % r->classifications;
2268	temp /= r->classifications;
2269	}
2270	#endif
2271	}
2272	}
2273	}
2274	for (i=0; i < classwords && pcount < part_read; ++i, ++pcount) {
2275	for (j=0; j < ch; ++j) {
2276	if (!do_not_decode[j]) {
2277	#ifndef STB_VORBIS_DIVIDES_IN_RESIDUE
2278	int c = part_classdata[j][class_set][i];
2279	#else
2280	int c = classifications[j][pcount];
2281	#endif
2282	int b = r->residue_books[c][pass];
2283	if (b >= 0) {
2284	float *target = residue_buffers[j];
2285	int offset = r->begin + pcount * r->part_size;
2286	int n = r->part_size;
2287	Codebook *book = f->codebooks + b;
2288	if (!residue_decode(f, book, target, offset, n, rtype))
2289	goto done;
2290	}
2291	}
2292	}
2293	}
2294	#ifndef STB_VORBIS_DIVIDES_IN_RESIDUE
2295	++class_set;
2296	#endif
2297	}
2298	}
2299	done:
2300	stb_prof(0)(void)0;
2301	temp_alloc_restore(f,temp_alloc_point)((f)->temp_offset = (temp_alloc_point));
2302	}
2303
2304
2305	#if 0
2306	// slow way for debugging
2307	void inverse_mdct_slow(float *buffer, int n)
2308	{
2309	int i,j;
2310	int n2 = n >> 1;
2311	float x = (float ) malloc(sizeof(x) n2);
2312	memcpy(x, buffer, sizeof(x) n2);
2313	for (i=0; i < n; ++i) {
2314	float acc = 0;
2315	for (j=0; j < n2; ++j)
2316	// formula from paper:
2317	//acc += n/4.0f * x[j] * (float) cos(M_PI / 2 / n * (2 * i + 1 + n/2.0)(2j+1));
2318	// formula from wikipedia
2319	//acc += 2.0f / n2 * x[j] * (float) cos(M_PI/n2 * (i + 0.5 + n2/2)*(j + 0.5));
2320	// these are equivalent, except the formula from the paper inverts the multiplier!
2321	// however, what actually works is NO MULTIPLIER!?!
2322	//acc += 64 * 2.0f / n2 * x[j] * (float) cos(M_PI/n2 * (i + 0.5 + n2/2)*(j + 0.5));
2323	acc += x[j] * (float) cos(M_PI3.14159265358979323846 / 2 / n * (2 * i + 1 + n/2.0)(2j+1));
2324	buffer[i] = acc;
2325	}
2326	free(x);
2327	}
2328	#elif 0
2329	// same as above, but just barely able to run in real time on modern machines
2330	void inverse_mdct_slow(float buffer, int n, vorb f, int blocktype)
2331	{
2332	float mcos[16384];
2333	int i,j;
2334	int n2 = n >> 1, nmask = (n << 2) -1;
2335	float x = (float ) malloc(sizeof(x) n2);
2336	memcpy(x, buffer, sizeof(x) n2);
2337	for (i=0; i < 4*n; ++i)
2338	mcos[i] = (float) cos(M_PI3.14159265358979323846 / 2 * i / n);
2339
2340	for (i=0; i < n; ++i) {
2341	float acc = 0;
2342	for (j=0; j < n2; ++j)
2343	acc += x[j] * mcos[(2 * i + 1 + n2)(2j+1) & nmask];
2344	buffer[i] = acc;
2345	}
2346	free(x);
2347	}
2348	#else
2349	// transform to use a slow dct-iv; this is STILL basically trivial,
2350	// but only requires half as many ops
2351	void dct_iv_slow(float *buffer, int n)
2352	{
2353	float mcos[16384];
2354	float x[2048];
2355	int i,j;
2356	int n2 = n >> 1, nmask = (n << 3) - 1;
2357	(void)n2;
2358	memcpy(x, buffer, sizeof(x) n);
2359	for (i=0; i < 8*n; ++i)
2360	mcos[i] = (float) cos(M_PI3.14159265358979323846 / 4 * i / n);
2361	for (i=0; i < n; ++i) {
2362	float acc = 0;
2363	for (j=0; j < n; ++j)
2364	acc += x[j] * mcos[((2 * i + 1)(2j+1)) & nmask];
2365	//acc += x[j] * cos(M_PI / n * (i + 0.5) * (j + 0.5));
2366	buffer[i] = acc;
2367	}
2368	}
2369
2370	void inverse_mdct_slow(float buffer, int n, vorb f, int blocktype)
2371	{
2372	int i, n4 = n >> 2, n2 = n >> 1, n3_4 = n - n4;
2373	float temp[4096];
2374
2375	memcpy(temp, buffer, n2 * sizeof(float));
2376	dct_iv_slow(temp, n2); // returns -c'-d, a-b'
2377
2378	for (i=0; i < n4 ; ++i) buffer[i] = temp[i+n4]; // a-b'
2379	for ( ; i < n3_4; ++i) buffer[i] = -temp[n3_4 - i - 1]; // b-a', c+d'
2380	for ( ; i < n ; ++i) buffer[i] = -temp[i - n3_4]; // c'+d
2381	}
2382	#endif
2383
#ifndef LIBVORBIS_MDCT
#define LIBVORBIS_MDCT 0
#endif

#if LIBVORBIS_MDCT
// directly call the vorbis MDCT using an interface documented
// by Jeff Roberts... useful for performance comparison
typedef struct
{
   int n;
   int log2n;

   float *trig;
   int   *bitrev;

   float scale;
} mdct_lookup;

extern void mdct_init(mdct_lookup *lookup, int n);
extern void mdct_clear(mdct_lookup *l);
extern void mdct_backward(mdct_lookup *init, float *in, float *out);

// one cached lookup per block size seen so far (at most two)
mdct_lookup M1,M2;

// Runs the external mdct_backward in place on buffer, initializing M1 or M2
// for block size n on first use. Hits a debugger breakpoint if a third
// distinct block size shows up. f and blocktype are not used.
void inverse_mdct(float *buffer, int n, vorb *f, int blocktype)
{
   mdct_lookup *M;
   if (M1.n == n) M = &M1;
   else if (M2.n == n) M = &M2;
   else if (M1.n == 0) { mdct_init(&M1, n); M = &M1; }
   else {
      if (M2.n) __asm int 3;
      mdct_init(&M2, n);
      M = &M2;
   }

   mdct_backward(M, buffer, buffer);
}
#endif
2423
2424
2425	// the following were split out into separate functions while optimizing;
2426	// they could be pushed back up but eh. __forceinline showed no change;
2427	// they're probably already being inlined.
// Butterfly pass over two runs of floats that are walked downward from
// ee0 = e + i_off and ee2 = ee0 + k_off. For each (even, odd) pair the sum is
// stored back in the ee0 run and the difference, rotated by the twiddle
// pair (A[0], A[1]), is stored in the ee2 run. A advances by 8 floats after
// every pair. Each loop iteration handles 8 floats per run; n must be a
// multiple of 4 and n/4 iterations are executed.
static void imdct_step3_iter0_loop(int n, float *e, int i_off, int k_off, float *A)
{
   float *ee0 = e + i_off;
   float *ee2 = ee0 + k_off;
   int i;

   assert((n & 3) == 0);
   for (i=(n>>2); i > 0; --i) {
      float k00_20, k01_21;
      k00_20  = ee0[ 0] - ee2[ 0];
      k01_21  = ee0[-1] - ee2[-1];
      ee0[ 0] += ee2[ 0];//ee0[ 0] = ee0[ 0] + ee2[ 0];
      ee0[-1] += ee2[-1];//ee0[-1] = ee0[-1] + ee2[-1];
      ee2[ 0] = k00_20 * A[0] - k01_21 * A[1];
      ee2[-1] = k01_21 * A[0] + k00_20 * A[1];
      A += 8;

      k00_20  = ee0[-2] - ee2[-2];
      k01_21  = ee0[-3] - ee2[-3];
      ee0[-2] += ee2[-2];//ee0[-2] = ee0[-2] + ee2[-2];
      ee0[-3] += ee2[-3];//ee0[-3] = ee0[-3] + ee2[-3];
      ee2[-2] = k00_20 * A[0] - k01_21 * A[1];
      ee2[-3] = k01_21 * A[0] + k00_20 * A[1];
      A += 8;

      k00_20  = ee0[-4] - ee2[-4];
      k01_21  = ee0[-5] - ee2[-5];
      ee0[-4] += ee2[-4];//ee0[-4] = ee0[-4] + ee2[-4];
      ee0[-5] += ee2[-5];//ee0[-5] = ee0[-5] + ee2[-5];
      ee2[-4] = k00_20 * A[0] - k01_21 * A[1];
      ee2[-5] = k01_21 * A[0] + k00_20 * A[1];
      A += 8;

      k00_20  = ee0[-6] - ee2[-6];
      k01_21  = ee0[-7] - ee2[-7];
      ee0[-6] += ee2[-6];//ee0[-6] = ee0[-6] + ee2[-6];
      ee0[-7] += ee2[-7];//ee0[-7] = ee0[-7] + ee2[-7];
      ee2[-6] = k00_20 * A[0] - k01_21 * A[1];
      ee2[-7] = k01_21 * A[0] + k00_20 * A[1];
      A += 8;
      ee0 -= 8;
      ee2 -= 8;
   }
}
2472
// Same butterfly as imdct_step3_iter0_loop, but the twiddle pointer A
// advances by k1 floats after every pair instead of a fixed 8. The two runs
// start at e0 = e + d0 and e2 = e0 + k_off and are walked downward, 8 floats
// per iteration, for lim/4 iterations.
static void imdct_step3_inner_r_loop(int lim, float *e, int d0, int k_off, float *A, int k1)
{
   int i;
   float k00_20, k01_21;

   float *e0 = e + d0;
   float *e2 = e0 + k_off;

   for (i=lim >> 2; i > 0; --i) {
      k00_20 = e0[-0] - e2[-0];
      k01_21 = e0[-1] - e2[-1];
      e0[-0] += e2[-0];//e0[-0] = e0[-0] + e2[-0];
      e0[-1] += e2[-1];//e0[-1] = e0[-1] + e2[-1];
      e2[-0] = (k00_20)*A[0] - (k01_21) * A[1];
      e2[-1] = (k01_21)*A[0] + (k00_20) * A[1];

      A += k1;

      k00_20 = e0[-2] - e2[-2];
      k01_21 = e0[-3] - e2[-3];
      e0[-2] += e2[-2];//e0[-2] = e0[-2] + e2[-2];
      e0[-3] += e2[-3];//e0[-3] = e0[-3] + e2[-3];
      e2[-2] = (k00_20)*A[0] - (k01_21) * A[1];
      e2[-3] = (k01_21)*A[0] + (k00_20) * A[1];

      A += k1;

      k00_20 = e0[-4] - e2[-4];
      k01_21 = e0[-5] - e2[-5];
      e0[-4] += e2[-4];//e0[-4] = e0[-4] + e2[-4];
      e0[-5] += e2[-5];//e0[-5] = e0[-5] + e2[-5];
      e2[-4] = (k00_20)*A[0] - (k01_21) * A[1];
      e2[-5] = (k01_21)*A[0] + (k00_20) * A[1];

      A += k1;

      k00_20 = e0[-6] - e2[-6];
      k01_21 = e0[-7] - e2[-7];
      e0[-6] += e2[-6];//e0[-6] = e0[-6] + e2[-6];
      e0[-7] += e2[-7];//e0[-7] = e0[-7] + e2[-7];
      e2[-6] = (k00_20)*A[0] - (k01_21) * A[1];
      e2[-7] = (k01_21)*A[0] + (k00_20) * A[1];

      e0 -= 8;
      e2 -= 8;

      A += k1;
   }
}
2522
// Butterfly pass in which the same four twiddle pairs are reused on every
// iteration: (A[0],A[1]), (A[a_off],A[a_off+1]), (A[2*a_off],A[2*a_off+1])
// and (A[3*a_off],A[3*a_off+1]) are loaded once up front. Each of the n
// iterations processes 8 floats below ee0 = e + i_off and 8 below
// ee2 = ee0 + k_off, then both pointers move down by k0 floats.
static void imdct_step3_inner_s_loop(int n, float *e, int i_off, int k_off, float *A, int a_off, int k0)
{
   int i;
   float A0 = A[0];
   float A1 = A[0+1];
   float A2 = A[0+a_off];
   float A3 = A[0+a_off+1];
   float A4 = A[0+a_off*2+0];
   float A5 = A[0+a_off*2+1];
   float A6 = A[0+a_off*3+0];
   float A7 = A[0+a_off*3+1];

   float k00,k11;

   float *ee0 = e  +i_off;
   float *ee2 = ee0+k_off;

   for (i=n; i > 0; --i) {
      k00     = ee0[ 0] - ee2[ 0];
      k11     = ee0[-1] - ee2[-1];
      ee0[ 0] =  ee0[ 0] + ee2[ 0];
      ee0[-1] =  ee0[-1] + ee2[-1];
      ee2[ 0] = (k00) * A0 - (k11) * A1;
      ee2[-1] = (k11) * A0 + (k00) * A1;

      k00     = ee0[-2] - ee2[-2];
      k11     = ee0[-3] - ee2[-3];
      ee0[-2] =  ee0[-2] + ee2[-2];
      ee0[-3] =  ee0[-3] + ee2[-3];
      ee2[-2] = (k00) * A2 - (k11) * A3;
      ee2[-3] = (k11) * A2 + (k00) * A3;

      k00     = ee0[-4] - ee2[-4];
      k11     = ee0[-5] - ee2[-5];
      ee0[-4] =  ee0[-4] + ee2[-4];
      ee0[-5] =  ee0[-5] + ee2[-5];
      ee2[-4] = (k00) * A4 - (k11) * A5;
      ee2[-5] = (k11) * A4 + (k00) * A5;

      k00     = ee0[-6] - ee2[-6];
      k11     = ee0[-7] - ee2[-7];
      ee0[-6] =  ee0[-6] + ee2[-6];
      ee0[-7] =  ee0[-7] + ee2[-7];
      ee2[-6] = (k00) * A6 - (k11) * A7;
      ee2[-7] = (k11) * A6 + (k00) * A7;

      ee0 -= k0;
      ee2 -= k0;
   }
}
2573
// In-place 8-float butterfly on z[0], z[-1], ..., z[-7] using only adds and
// subtracts (no twiddle multiplies). The trailing comments give each output
// in terms of the inputs, where zK stands for the original z[-K].
static __forceinline void iter_54(float *z)
{
   float k00,k11,k22,k33;
   float y0,y1,y2,y3;

   k00  = z[ 0] - z[-4];
   y0   = z[ 0] + z[-4];
   y2   = z[-2] + z[-6];
   k22  = z[-2] - z[-6];

   z[-0] = y0 + y2;      // z0 + z4 + z2 + z6
   z[-2] = y0 - y2;      // z0 + z4 - z2 - z6

   // done with y0,y2

   k33  = z[-3] - z[-7];

   z[-4] = k00 + k33;    // z0 - z4 + z3 - z7
   z[-6] = k00 - k33;    // z0 - z4 - z3 + z7

   // done with k33

   k11  = z[-1] - z[-5];
   y1   = z[-1] + z[-5];
   y3   = z[-3] + z[-7];

   z[-1] = y1 + y3;      // z1 + z5 + z3 + z7
   z[-3] = y1 - y3;      // z1 + z5 - z3 - z7
   z[-5] = k11 - k22;    // z1 - z5 + z2 - z6
   z[-7] = k11 + k22;    // z1 - z5 - z2 + z6
}
2605
// Processes n consecutive groups of 16 floats, walking downward from
// z = e + i_off. Within a group the upper 8 floats are butterflied against
// the lower 8; two of the four pairs need no multiply at all and the other
// two are scaled by the single twiddle value A[base_n >> 3]. Each half of
// the group is then finished with iter_54.
static void imdct_step3_inner_s_loop_ld654(int n, float *e, int i_off, float *A, int base_n)
{
   int a_off = base_n >> 3;
   float A2 = A[0+a_off];
   float *z = e + i_off;
   float *base = z - 16 * n;

   while (z > base) {
      float k00,k11;

      k00   = z[-0] - z[-8];
      k11   = z[-1] - z[-9];
      z[-0] = z[-0] + z[-8];
      z[-1] = z[-1] + z[-9];
      z[-8] =  k00;
      z[-9] =  k11 ;

      k00    = z[ -2] - z[-10];
      k11    = z[ -3] - z[-11];
      z[ -2] = z[ -2] + z[-10];
      z[ -3] = z[ -3] + z[-11];
      z[-10] = (k00+k11) * A2;
      z[-11] = (k11-k00) * A2;

      k00    = z[-12] - z[ -4];  // reverse to avoid a unary negation
      k11    = z[ -5] - z[-13];
      z[ -4] = z[ -4] + z[-12];
      z[ -5] = z[ -5] + z[-13];
      z[-12] = k11;
      z[-13] = k00;

      k00    = z[-14] - z[ -6];  // reverse to avoid a unary negation
      k11    = z[ -7] - z[-15];
      z[ -6] = z[ -6] + z[-14];
      z[ -7] = z[ -7] + z[-15];
      z[-14] = (k00+k11) * A2;
      z[-15] = (k00-k11) * A2;

      iter_54(z);
      iter_54(z-8);
      z -= 16;
   }
}
2651
2652	static void inverse_mdct(float buffer, int n, vorb f, int blocktype)
2653	{
2654	int n2 = n >> 1, n4 = n >> 2, n8 = n >> 3, l;
2655	int n3_4 = n - n4, ld;
2656	(void)n3_4;
2657	// @OPTIMIZE: reduce register pressure by using fewer variables?
2658	int save_point = temp_alloc_save(f)((f)->temp_offset);
2659	float buf2 = (float ) temp_alloc(f, n2 * sizeof(buf2))(f->alloc.alloc_buffer ? setup_temp_malloc(f,n2 sizeof(* buf2)) : alloca(n2 * sizeof(*buf2)));
2660	float u=NULL((void)0),v=NULL((void)0);
2661	// twiddle factors
2662	float *A = f->A[blocktype];
2663
2664	// IMDCT algorithm from "The use of multirate filter banks for coding of high quality digital audio"
2665	// See notes about bugs in that paper in less-optimal implementation 'inverse_mdct_old' after this function.
2666
2667	// kernel from paper
2668
2669
2670	// merged:
2671	// copy and reflect spectral data
2672	// step 0
2673
2674	// note that it turns out that the items added together during
2675	// this step are, in fact, being added to themselves (as reflected
2676	// by step 0). inexplicable inefficiency! this became obvious
2677	// once I combined the passes.
2678
2679	// so there's a missing 'times 2' here (for adding X to itself).
2680	// this propogates through linearly to the end, where the numbers
2681	// are 1/2 too small, and need to be compensated for.
2682
2683	{
2684	float d,e, AA, e_stop;
2685	d = &buf2[n2-2];
2686	AA = A;
2687	e = &buffer[0];
2688	e_stop = &buffer[n2];
2689	while (e != e_stop) {
2690	d[1] = (e[0] * AA[0] - e[2]*AA[1]);
2691	d[0] = (e[0] * AA[1] + e[2]*AA[0]);
2692	d -= 2;
2693	AA += 2;
2694	e += 4;
2695	}
2696
2697	e = &buffer[n2-3];
2698	while (d >= buf2) {
2699	d[1] = (-e[2] * AA[0] - -e[0]*AA[1]);
2700	d[0] = (-e[2] * AA[1] + -e[0]*AA[0]);
2701	d -= 2;
2702	AA += 2;
2703	e -= 4;
2704	}
2705	}
2706
2707	// now we use symbolic names for these, so that we can
2708	// possibly swap their meaning as we change which operations
2709	// are in place
2710
2711	u = buffer;
2712	v = buf2;
2713
2714	// step 2 (paper output is w, now u)
2715	// this could be in place, but the data ends up in the wrong
2716	// place... _somebody_'s got to swap it, so this is nominated
2717	{
2718	float *AA = &A[n2-8];
2719	float d0,d1, e0, e1;
2720
2721	e0 = &v[n4];
2722	e1 = &v[0];
2723
2724	d0 = &u[n4];
2725	d1 = &u[0];
2726
2727	while (AA >= A) {
2728	float v40_20, v41_21;
2729
2730	v41_21 = e0[1] - e1[1];
2731	v40_20 = e0[0] - e1[0];
2732	d0[1] = e0[1] + e1[1];
2733	d0[0] = e0[0] + e1[0];
2734	d1[1] = v41_21AA[4] - v40_20AA[5];
2735	d1[0] = v40_20AA[4] + v41_21AA[5];
2736
2737	v41_21 = e0[3] - e1[3];
2738	v40_20 = e0[2] - e1[2];
2739	d0[3] = e0[3] + e1[3];
2740	d0[2] = e0[2] + e1[2];
2741	d1[3] = v41_21AA[0] - v40_20AA[1];
2742	d1[2] = v40_20AA[0] + v41_21AA[1];
2743
2744	AA -= 8;
2745
2746	d0 += 4;
2747	d1 += 4;
2748	e0 += 4;
2749	e1 += 4;
2750	}
2751	}
2752
2753	// step 3
2754	ld = ilog(n) - 1; // ilog is off-by-one from normal definitions
2755
2756	// optimized step 3:
2757
2758	// the original step3 loop can be nested r inside s or s inside r;
2759	// it's written originally as s inside r, but this is dumb when r
2760	// iterates many times, and s few. So I have two copies of it and
2761	// switch between them halfway.
2762
2763	// this is iteration 0 of step 3
2764	imdct_step3_iter0_loop(n >> 4, u, n2-1-n4*0, -(n >> 3), A);
2765	imdct_step3_iter0_loop(n >> 4, u, n2-1-n4*1, -(n >> 3), A);
2766
2767	// this is iteration 1 of step 3
2768	imdct_step3_inner_r_loop(n >> 5, u, n2-1 - n8*0, -(n >> 4), A, 16);
2769	imdct_step3_inner_r_loop(n >> 5, u, n2-1 - n8*1, -(n >> 4), A, 16);
2770	imdct_step3_inner_r_loop(n >> 5, u, n2-1 - n8*2, -(n >> 4), A, 16);
2771	imdct_step3_inner_r_loop(n >> 5, u, n2-1 - n8*3, -(n >> 4), A, 16);
2772
2773	l=2;
2774	for (; l < (ld-3)>>1; ++l) {
2775	int k0 = n >> (l+2), k0_2 = k0>>1;
2776	int lim = 1 << (l+1);
2777	int i;
2778	for (i=0; i < lim; ++i)
2779	imdct_step3_inner_r_loop(n >> (l+4), u, n2-1 - k0*i, -k0_2, A, 1 << (l+3));
2780	}
2781
2782	for (; l < ld-6; ++l) {
2783	int k0 = n >> (l+2), k1 = 1 << (l+3), k0_2 = k0>>1;
2784	int rlim = n >> (l+6), r;
2785	int lim = 1 << (l+1);
2786	int i_off;
2787	float *A0 = A;
2788	i_off = n2-1;
2789	for (r=rlim; r > 0; --r) {
2790	imdct_step3_inner_s_loop(lim, u, i_off, -k0_2, A0, k1, k0);
2791	A0 += k1*4;
2792	i_off -= 8;
2793	}
2794	}
2795
2796	// iterations with count:
2797	// ld-6,-5,-4 all interleaved together
2798	// the big win comes from getting rid of needless flops
2799	// due to the constants on pass 5 & 4 being all 1 and 0;
2800	// combining them to be simultaneous to improve cache made little difference
2801	imdct_step3_inner_s_loop_ld654(n >> 5, u, n2-1, A, n);
2802
2803	// output is u
2804
2805	// step 4, 5, and 6
2806	// cannot be in-place because of step 5
2807	{
2808	uint16 *bitrev = f->bit_reverse[blocktype];
2809	// weirdly, I'd have thought reading sequentially and writing
2810	// erratically would have been better than vice-versa, but in
2811	// fact that's not what my testing showed. (That is, with
2812	// j = bitreverse(i), do you read i and write j, or read j and write i.)
2813
2814	float *d0 = &v[n4-4];
2815	float *d1 = &v[n2-4];
2816	while (d0 >= v) {
2817	int k4;
2818
2819	k4 = bitrev[0];
2820	d1[3] = u[k4+0];
2821	d1[2] = u[k4+1];
2822	d0[3] = u[k4+2];
2823	d0[2] = u[k4+3];
2824
2825	k4 = bitrev[1];
2826	d1[1] = u[k4+0];
2827	d1[0] = u[k4+1];
2828	d0[1] = u[k4+2];
2829	d0[0] = u[k4+3];
2830
2831	d0 -= 4;
2832	d1 -= 4;
2833	bitrev += 2;
2834	}
2835	}
2836	// (paper output is u, now v)
2837
2838
2839	// data must be in buf2
2840	assert(v == buf2)((v == buf2) ? (void)0 : _assert("v == buf2", "src/siege/internal/stb/stb_vorbis.c" , 2840));
2841
2842	// step 7 (paper output is v, now v)
2843	// this is now in place
2844	{
2845	float *C(2 \| 4 \| 1) = f->C(2 \| 4 \| 1)[blocktype];
2846	float d, e;
2847
2848	d = v;
2849	e = v + n2 - 4;
2850
2851	while (d < e) {
2852	float a02,a11,b0,b1,b2,b3;
2853
2854	a02 = d[0] - e[2];
2855	a11 = d[1] + e[3];
2856
2857	b0 = C(2 \| 4 \| 1)[1]a02 + C(2 \| 4 \| 1)[0]a11;
2858	b1 = C(2 \| 4 \| 1)[1]a11 - C(2 \| 4 \| 1)[0]a02;
2859
2860	b2 = d[0] + e[ 2];
2861	b3 = d[1] - e[ 3];
2862
2863	d[0] = b2 + b0;
2864	d[1] = b3 + b1;
2865	e[2] = b2 - b0;
2866	e[3] = b1 - b3;
2867
2868	a02 = d[2] - e[0];
2869	a11 = d[3] + e[1];
2870
2871	b0 = C(2 \| 4 \| 1)[3]a02 + C(2 \| 4 \| 1)[2]a11;
2872	b1 = C(2 \| 4 \| 1)[3]a11 - C(2 \| 4 \| 1)[2]a02;
2873
2874	b2 = d[2] + e[ 0];
2875	b3 = d[3] - e[ 1];
2876
2877	d[2] = b2 + b0;
2878	d[3] = b3 + b1;
2879	e[0] = b2 - b0;
2880	e[1] = b1 - b3;
2881
2882	C(2 \| 4 \| 1) += 4;
2883	d += 4;
2884	e -= 4;
2885	}
2886	}
2887
2888	// data must be in buf2
2889
2890
2891	// step 8+decode (paper output is X, now buffer)
2892	// this generates pairs of data a la 8 and pushes them directly through
2893	// the decode kernel (pushing rather than pulling) to avoid having
2894	// to make another pass later
2895
2896	// this cannot POSSIBLY be in place, so we refer to the buffers directly
2897
2898	{
2899	float d0,d1,d2,d3;
2900
2901	float *B = f->B[blocktype] + n2 - 8;
2902	float *e = buf2 + n2 - 8;
2903	d0 = &buffer[0];
2904	d1 = &buffer[n2-4];
2905	d2 = &buffer[n2];
2906	d3 = &buffer[n-4];
2907	while (e >= v) {
2908	float p0,p1,p2,p3;
2909
2910	p3 = e[6]B[7] - e[7]B[6];
2911	p2 = -e[6]B[6] - e[7]B[7];
2912
2913	d0[0] = p3;
2914	d1[3] = - p3;
2915	d2[0] = p2;
2916	d3[3] = p2;
2917
2918	p1 = e[4]B[5] - e[5]B[4];
2919	p0 = -e[4]B[4] - e[5]B[5];
2920
2921	d0[1] = p1;
2922	d1[2] = - p1;
2923	d2[1] = p0;
2924	d3[2] = p0;
2925
2926	p3 = e[2]B[3] - e[3]B[2];
2927	p2 = -e[2]B[2] - e[3]B[3];
2928
2929	d0[2] = p3;
2930	d1[1] = - p3;
2931	d2[2] = p2;
2932	d3[1] = p2;
2933
2934	p1 = e[0]B[1] - e[1]B[0];
2935	p0 = -e[0]B[0] - e[1]B[1];
2936
2937	d0[3] = p1;
2938	d1[0] = - p1;
2939	d2[3] = p0;
2940	d3[0] = p0;
2941
2942	B -= 8;
2943	e -= 8;
2944	d0 += 4;
2945	d2 += 4;
2946	d1 -= 4;
2947	d3 -= 4;
2948	}
2949	}
2950
2951	temp_alloc_restore(f,save_point)((f)->temp_offset = (save_point));
2952	}
2953
#if 0
// this is the original version of the above code, if you want to optimize it from scratch
//
// Reference (disabled) inverse MDCT: recomputes the twiddle tables on every
// call and follows the paper's steps 1-8 literally, using large stack arrays
// as scratch. `buffer` is read for n/2 coefficients and receives n outputs.
void inverse_mdct_naive(float *buffer, int n)
{
   float s;
   float A[1 << 12], B[1 << 12], C[1 << 11];
   int i,k,k2,k4, n2 = n >> 1, n4 = n >> 2, n8 = n >> 3, l;
   int n3_4 = n - n4, ld;
   // how can they claim this only uses N words?!
   // oh, because they're only used sparsely, whoops
   float u[1 << 13], X[1 << 13], v[1 << 13], w[1 << 13];
   // set up twiddle factors

   for (k=k2=0; k < n4; ++k,k2+=2) {
      A[k2  ] = (float)  cos(4*k*M_PI/n);
      A[k2+1] = (float) -sin(4*k*M_PI/n);
      B[k2  ] = (float)  cos((k2+1)*M_PI/n/2);
      B[k2+1] = (float)  sin((k2+1)*M_PI/n/2);
   }
   for (k=k2=0; k < n8; ++k,k2+=2) {
      C[k2  ] = (float)  cos(2*(k2+1)*M_PI/n);
      C[k2+1] = (float) -sin(2*(k2+1)*M_PI/n);
   }

   // IMDCT algorithm from "The use of multirate filter banks for coding of high quality digital audio"
   // Note there are bugs in that pseudocode, presumably due to them attempting
   // to rename the arrays nicely rather than representing the way their actual
   // implementation bounces buffers back and forth. As a result, even in the
   // "some formulars corrected" version, a direct implementation fails. These
   // are noted below as "paper bug".

   // copy and reflect spectral data
   for (k=0; k < n2; ++k) u[k] = buffer[k];
   for (   ; k < n ; ++k) u[k] = -buffer[n - k - 1];
   // kernel from paper
   // step 1
   for (k=k2=k4=0; k < n4; k+=1, k2+=2, k4+=4) {
      v[n-k4-1] = (u[k4] - u[n-k4-1]) * A[k2]   - (u[k4+2] - u[n-k4-3])*A[k2+1];
      v[n-k4-3] = (u[k4] - u[n-k4-1]) * A[k2+1] + (u[k4+2] - u[n-k4-3])*A[k2];
   }
   // step 2
   for (k=k4=0; k < n8; k+=1, k4+=4) {
      w[n2+3+k4] = v[n2+3+k4] + v[k4+3];
      w[n2+1+k4] = v[n2+1+k4] + v[k4+1];
      w[k4+3]    = (v[n2+3+k4] - v[k4+3])*A[n2-4-k4] - (v[n2+1+k4]-v[k4+1])*A[n2-3-k4];
      w[k4+1]    = (v[n2+1+k4] - v[k4+1])*A[n2-4-k4] + (v[n2+3+k4]-v[k4+3])*A[n2-3-k4];
   }
   // step 3
   ld = ilog(n) - 1; // ilog is off-by-one from normal definitions
   for (l=0; l < ld-3; ++l) {
      int k0 = n >> (l+2), k1 = 1 << (l+3);
      int rlim = n >> (l+4), r4, r;
      int s2lim = 1 << (l+2), s2;
      for (r=r4=0; r < rlim; r4+=4,++r) {
         for (s2=0; s2 < s2lim; s2+=2) {
            u[n-1-k0*s2-r4] = w[n-1-k0*s2-r4] + w[n-1-k0*(s2+1)-r4];
            u[n-3-k0*s2-r4] = w[n-3-k0*s2-r4] + w[n-3-k0*(s2+1)-r4];
            u[n-1-k0*(s2+1)-r4] = (w[n-1-k0*s2-r4] - w[n-1-k0*(s2+1)-r4]) * A[r*k1]
                                - (w[n-3-k0*s2-r4] - w[n-3-k0*(s2+1)-r4]) * A[r*k1+1];
            u[n-3-k0*(s2+1)-r4] = (w[n-3-k0*s2-r4] - w[n-3-k0*(s2+1)-r4]) * A[r*k1]
                                + (w[n-1-k0*s2-r4] - w[n-1-k0*(s2+1)-r4]) * A[r*k1+1];
         }
      }
      if (l+1 < ld-3) {
         // paper bug: ping-ponging of u&w here is omitted
         memcpy(w, u, sizeof(u));
      }
   }

   // step 4
   for (i=0; i < n8; ++i) {
      int j = bit_reverse(i) >> (32-ld+3);
      assert(j < n8);
      if (i == j) {
         // paper bug: original code probably swapped in place; if copying,
         //            need to directly copy in this case
         int i8 = i << 3;
         v[i8+1] = u[i8+1];
         v[i8+3] = u[i8+3];
         v[i8+5] = u[i8+5];
         v[i8+7] = u[i8+7];
      } else if (i < j) {
         int i8 = i << 3, j8 = j << 3;
         v[j8+1] = u[i8+1], v[i8+1] = u[j8 + 1];
         v[j8+3] = u[i8+3], v[i8+3] = u[j8 + 3];
         v[j8+5] = u[i8+5], v[i8+5] = u[j8 + 5];
         v[j8+7] = u[i8+7], v[i8+7] = u[j8 + 7];
      }
   }
   // step 5
   for (k=0; k < n2; ++k) {
      w[k] = v[k*2+1];
   }
   // step 6
   for (k=k2=k4=0; k < n8; ++k, k2 += 2, k4 += 4) {
      u[n-1-k2] = w[k4];
      u[n-2-k2] = w[k4+1];
      u[n3_4 - 1 - k2] = w[k4+2];
      u[n3_4 - 2 - k2] = w[k4+3];
   }
   // step 7
   for (k=k2=0; k < n8; ++k, k2 += 2) {
      v[n2 + k2 ] = ( u[n2 + k2] + u[n-2-k2] + C[k2+1]*(u[n2+k2]-u[n-2-k2]) + C[k2]*(u[n2+k2+1]+u[n-2-k2+1]))/2;
      v[n-2 - k2] = ( u[n2 + k2] + u[n-2-k2] - C[k2+1]*(u[n2+k2]-u[n-2-k2]) - C[k2]*(u[n2+k2+1]+u[n-2-k2+1]))/2;
      v[n2+1+ k2] = ( u[n2+1+k2] - u[n-1-k2] + C[k2+1]*(u[n2+1+k2]+u[n-1-k2]) - C[k2]*(u[n2+k2]-u[n-2-k2]))/2;
      v[n-1 - k2] = (-u[n2+1+k2] + u[n-1-k2] + C[k2+1]*(u[n2+1+k2]+u[n-1-k2]) - C[k2]*(u[n2+k2]-u[n-2-k2]))/2;
   }
   // step 8
   for (k=k2=0; k < n4; ++k,k2 += 2) {
      X[k]      = v[k2+n2]*B[k2  ] + v[k2+1+n2]*B[k2+1];
      X[n2-1-k] = v[k2+n2]*B[k2+1] - v[k2+1+n2]*B[k2  ];
   }

   // decode kernel to output
   // determined the following value experimentally
   // (by first figuring out what made inverse_mdct_slow work); then matching that here
   // (probably vorbis encoder premultiplies by n or n/2, to save it on the decoder?)
   s = 0.5; // theoretically would be n4

   // [[[ note! the s value of 0.5 is compensated for by the B[] in the current code,
   //     so it needs to use the "old" B values to behave correctly, or else
   //     set s to 1.0 ]]]
   for (i=0; i < n4  ; ++i) buffer[i] = s * X[i+n4];
   for (   ; i < n3_4; ++i) buffer[i] = -s * X[n3_4 - i - 1];
   for (   ; i < n   ; ++i) buffer[i] = -s * X[i - n3_4];
}
#endif
3081
3082	static float get_window(vorb f, int len)
3083	{
3084	len <<= 1;
3085	if (len == f->blocksize_0) return f->window[0];
3086	if (len == f->blocksize_1) return f->window[1];
3087	assert(0)((0) ? (void)0 : _assert("0", "src/siege/internal/stb/stb_vorbis.c" , 3087));
3088	return NULL((void*)0);
3089	}
3090
3091	#ifndef STB_VORBIS_NO_DEFER_FLOOR
3092	typedef int16 YTYPE;
3093	#else
3094	typedef int YTYPE;
3095	#endif
3096	static int do_floor(vorb f, Mapping map, int i, int n, float target, YTYPE finalY, uint8 *step2_flag)
3097	{
3098	int n2 = n >> 1;
3099	int s = map->chan[i].mux, floor;
3100	floor = map->submap_floor[s];
3101	if (f->floor_types[floor] == 0) {
3102	return error(f, VORBIS_invalid_stream);
3103	} else {
3104	Floor1 *g = &f->floor_config[floor].floor1;
3105	int j,q;
3106	int lx = 0, ly = finalY[0] * g->floor1_multiplier;
3107	for (q=1; q < g->values; ++q) {
3108	j = g->sorted_order[q];
3109	#ifndef STB_VORBIS_NO_DEFER_FLOOR
3110	if (finalY[j] >= 0)
3111	#else
3112	if (step2_flag[j])
3113	#endif
3114	{
3115	int hy = finalY[j] * g->floor1_multiplier;
3116	int hx = g->Xlist[j];
3117	draw_line(target, lx,ly, hx,hy, n2);
3118	lx = hx, ly = hy;
3119	}
3120	}
3121	if (lx < n2)
3122	// optimization of: draw_line(target, lx,ly, n,ly, n2);
3123	for (j=lx; j < n2; ++j)
3124	LINE_OP(target[j], inverse_db_table[ly])target[j] *= inverse_db_table[ly];
3125	}
3126	return TRUE1;
3127	}
3128
3129	static int vorbis_decode_initial(vorb f, int p_left_start, int p_left_end, int p_right_start, int p_right_end, int mode)
3130	{
3131	Mode *m;
3132	int i, n, prev, next, window_center;
3133	f->channel_buffer_start = f->channel_buffer_end = 0;
3134
3135	retry:
3136	if (f->eof) return FALSE0;
3137	if (!maybe_start_packet(f))
3138	return FALSE0;
3139	// check packet type
3140	if (get_bits(f,1) != 0) {
3141	if (IS_PUSH_MODE(f)((f)->push_mode))
3142	return error(f,VORBIS_bad_packet_type);
3143	while (EOP(-1) != get8_packet(f));
3144	goto retry;
3145	}
3146
3147	if (f->alloc.alloc_buffer)
3148	assert(f->alloc.alloc_buffer_length_in_bytes == f->temp_offset)((f->alloc.alloc_buffer_length_in_bytes == f->temp_offset ) ? (void)0 : _assert("f->alloc.alloc_buffer_length_in_bytes == f->temp_offset" , "src/siege/internal/stb/stb_vorbis.c", 3148));
3149
3150	i = get_bits(f, ilog(f->mode_count-1));
3151	if (i == EOP(-1)) return FALSE0;
3152	if (i >= f->mode_count) return FALSE0;
3153	*mode = i;
3154	m = f->mode_config + i;
3155	if (m->blockflag) {
3156	n = f->blocksize_1;
3157	prev = get_bits(f,1);
3158	next = get_bits(f,1);
3159	} else {
3160	prev = next = 0;
3161	n = f->blocksize_0;
3162	}
3163
3164	// WINDOWING
3165
3166	window_center = n >> 1;
3167	if (m->blockflag && !prev) {
3168	*p_left_start = (n - f->blocksize_0) >> 2;
3169	*p_left_end = (n + f->blocksize_0) >> 2;
3170	} else {
3171	*p_left_start = 0;
3172	*p_left_end = window_center;
3173	}
3174	if (m->blockflag && !next) {
3175	p_right_start = (n3 - f->blocksize_0) >> 2;
3176	p_right_end = (n3 + f->blocksize_0) >> 2;
3177	} else {
3178	*p_right_start = window_center;
3179	*p_right_end = n;
3180	}
3181	return TRUE1;
3182	}
3183
3184	static int vorbis_decode_packet_rest(vorb f, int len, Mode m, int left_start, int left_end, int right_start, int right_end, int p_left)
3185	{
3186	Mapping *map;
3187	int i,j,k,n,n2;
3188	int zero_channel[256];
3189	int really_zero_channel[256];
3190	int window_center;
3191
3192	// WINDOWING
3193
3194	n = f->blocksize[m->blockflag];
3195	window_center = n >> 1;
3196	(void)window_center;
3197
3198	map = &f->mapping[m->mapping];
3199
3200	// FLOORS
3201	n2 = n >> 1;
3202
3203	stb_prof(1)(void)0;
3204	for (i=0; i < f->channels; ++i) {
3205	int s = map->chan[i].mux, floor;
3206	zero_channel[i] = FALSE0;
3207	floor = map->submap_floor[s];
3208	if (f->floor_types[floor] == 0) {
3209	return error(f, VORBIS_invalid_stream);
3210	} else {
3211	Floor1 *g = &f->floor_config[floor].floor1;
3212	if (get_bits(f, 1)) {
3213	short *finalY;
3214	uint8 step2_flag[256];
3215	static int range_list[4] = { 256, 128, 86, 64 };
3216	int range = range_list[g->floor1_multiplier-1];
3217	int offset = 2;
3218	finalY = f->finalY[i];
3219	finalY[0] = get_bits(f, ilog(range)-1);
3220	finalY[1] = get_bits(f, ilog(range)-1);
3221	for (j=0; j < g->partitions; ++j) {
3222	int pclass = g->partition_class_list[j];
3223	int cdim = g->class_dimensions[pclass];
3224	int cbits = g->class_subclasses[pclass];
3225	int csub = (1 << cbits)-1;
3226	int cval = 0;
3227	if (cbits) {
3228	Codebook *c = f->codebooks + g->class_masterbooks[pclass];
3229	DECODE(cval,f,c)if (f->valid_bits < 10) prep_huffman(f); cval = f->acc & ((1 << 10) - 1); cval = c->fast_huffman[cval] ; if (cval >= 0) { int n = c->codeword_lengths[cval]; f ->acc >>= n; f->valid_bits -= n; if (f->valid_bits < 0) { f->valid_bits = 0; cval = -1; } } else { cval = codebook_decode_scalar_raw(f,c); } if (c->sparse) cval = c ->sorted_values[cval];;
3230	}
3231	for (k=0; k < cdim; ++k) {
3232	int book = g->subclass_books[pclass][cval & csub];
3233	cval = cval >> cbits;
3234	if (book >= 0) {
3235	int temp;
3236	Codebook *c = f->codebooks + book;
3237	DECODE(temp,f,c)if (f->valid_bits < 10) prep_huffman(f); temp = f->acc & ((1 << 10) - 1); temp = c->fast_huffman[temp] ; if (temp >= 0) { int n = c->codeword_lengths[temp]; f ->acc >>= n; f->valid_bits -= n; if (f->valid_bits < 0) { f->valid_bits = 0; temp = -1; } } else { temp = codebook_decode_scalar_raw(f,c); } if (c->sparse) temp = c ->sorted_values[temp];;
3238	finalY[offset++] = temp;
3239	} else
3240	finalY[offset++] = 0;
3241	}
3242	}
3243	if (f->valid_bits == INVALID_BITS(-1)) goto error; // behavior according to spec
3244	step2_flag[0] = step2_flag[1] = 1;
3245	for (j=2; j < g->values; ++j) {
3246	int low, high, pred, highroom, lowroom, room, val;
3247	low = g->neighbors[j][0];
3248	high = g->neighbors[j][1];
3249	//neighbors(g->Xlist, j, &low, &high);
3250	pred = predict_point(g->Xlist[j], g->Xlist[low], g->Xlist[high], finalY[low], finalY[high]);
3251	val = finalY[j];
3252	highroom = range - pred;
3253	lowroom = pred;
3254	if (highroom < lowroom)
3255	room = highroom * 2;
3256	else
3257	room = lowroom * 2;
3258	if (val) {
3259	step2_flag[low] = step2_flag[high] = 1;
3260	step2_flag[j] = 1;
3261	if (val >= room)
3262	if (highroom > lowroom)
3263	finalY[j] = val - lowroom + pred;
3264	else
3265	finalY[j] = pred - val + highroom - 1;
3266	else
3267	if (val & 1)
3268	finalY[j] = pred - ((val+1)>>1);
3269	else
3270	finalY[j] = pred + (val>>1);
3271	} else {
3272	step2_flag[j] = 0;
3273	finalY[j] = pred;
3274	}
3275	}
3276
3277	#ifdef STB_VORBIS_NO_DEFER_FLOOR
3278	do_floor(f, map, i, n, f->floor_buffers[i], finalY, step2_flag);
3279	#else
3280	// defer final floor computation until _after_ residue
3281	for (j=0; j < g->values; ++j) {
3282	if (!step2_flag[j])
3283	finalY[j] = -1;
3284	}
3285	#endif
3286	} else {
3287	error:
3288	zero_channel[i] = TRUE1;
3289	}
3290	// So we just defer everything else to later
3291
3292	// at this point we've decoded the floor into buffer
3293	}
3294	}
3295	stb_prof(0)(void)0;
3296	// at this point we've decoded all floors
3297
3298	if (f->alloc.alloc_buffer)
3299	assert(f->alloc.alloc_buffer_length_in_bytes == f->temp_offset)((f->alloc.alloc_buffer_length_in_bytes == f->temp_offset ) ? (void)0 : _assert("f->alloc.alloc_buffer_length_in_bytes == f->temp_offset" , "src/siege/internal/stb/stb_vorbis.c", 3299));
3300
3301	// re-enable coupled channels if necessary
3302	memcpy(really_zero_channel, zero_channel, sizeof(really_zero_channel[0]) * f->channels);
3303	for (i=0; i < map->coupling_steps; ++i)
3304	if (!zero_channel[map->chan[i].magnitude] \|\| !zero_channel[map->chan[i].angle]) {
3305	zero_channel[map->chan[i].magnitude] = zero_channel[map->chan[i].angle] = FALSE0;
3306	}
3307
3308	// RESIDUE DECODE
3309	for (i=0; i < map->submaps; ++i) {
3310	float *residue_buffers[STB_VORBIS_MAX_CHANNELS16];
3311	int r,t;
3312	uint8 do_not_decode[256];
3313	int ch = 0;
3314	for (j=0; j < f->channels; ++j) {
3315	if (map->chan[j].mux == i) {
3316	if (zero_channel[j]) {
3317	do_not_decode[ch] = TRUE1;
3318	residue_buffers[ch] = NULL((void*)0);
3319	} else {
3320	do_not_decode[ch] = FALSE0;
3321	residue_buffers[ch] = f->channel_buffers[j];
3322	}
3323	++ch;
3324	}
3325	}
3326	r = map->submap_residue[i];
3327	t = f->residue_types[r];
3328	(void)t;
3329	decode_residue(f, residue_buffers, ch, n2, r, do_not_decode);
3330	}
3331
3332	if (f->alloc.alloc_buffer)
3333	assert(f->alloc.alloc_buffer_length_in_bytes == f->temp_offset)((f->alloc.alloc_buffer_length_in_bytes == f->temp_offset ) ? (void)0 : _assert("f->alloc.alloc_buffer_length_in_bytes == f->temp_offset" , "src/siege/internal/stb/stb_vorbis.c", 3333));
3334
3335	// INVERSE COUPLING
3336	stb_prof(14)(void)0;
3337	for (i = map->coupling_steps-1; i >= 0; --i) {
3338	int n2 = n >> 1;
3339	float *m = f->channel_buffers[map->chan[i].magnitude];
3340	float *a = f->channel_buffers[map->chan[i].angle ];
3341	for (j=0; j < n2; ++j) {
3342	float a2,m2;
3343	if (m[j] > 0)
3344	if (a[j] > 0)
3345	m2 = m[j], a2 = m[j] - a[j];
3346	else
3347	a2 = m[j], m2 = m[j] + a[j];
3348	else
3349	if (a[j] > 0)
3350	m2 = m[j], a2 = m[j] + a[j];
3351	else
3352	a2 = m[j], m2 = m[j] - a[j];
3353	m[j] = m2;
3354	a[j] = a2;
3355	}
3356	}
3357
3358	// finish decoding the floors
3359	#ifndef STB_VORBIS_NO_DEFER_FLOOR
3360	stb_prof(15)(void)0;
3361	for (i=0; i < f->channels; ++i) {
3362	if (really_zero_channel[i]) {
3363	memset(f->channel_buffers[i], 0, sizeof(f->channel_buffers[i]) n2);
3364	} else {
3365	do_floor(f, map, i, n, f->channel_buffers[i], f->finalY[i], NULL((void*)0));
3366	}
3367	}
3368	#else
3369	for (i=0; i < f->channels; ++i) {
3370	if (really_zero_channel[i]) {
3371	memset(f->channel_buffers[i], 0, sizeof(f->channel_buffers[i]) n2);
3372	} else {
3373	for (j=0; j < n2; ++j)
3374	f->channel_buffers[i][j] *= f->floor_buffers[i][j];
3375	}
3376	}
3377	#endif
3378
3379	// INVERSE MDCT
3380	stb_prof(16)(void)0;
3381	for (i=0; i < f->channels; ++i)
3382	inverse_mdct(f->channel_buffers[i], n, f, m->blockflag);
3383	stb_prof(0)(void)0;
3384
3385	// this shouldn't be necessary, unless we exited on an error
3386	// and want to flush to get to the next packet
3387	flush_packet(f);
3388
3389	if (f->first_decode) {
3390	// assume we start so first non-discarded sample is sample 0
3391	// this isn't to spec, but spec would require us to read ahead
3392	// and decode the size of all current frames--could be done,
3393	// but presumably it's not a commonly used feature
3394	f->current_loc = -n2; // start of first frame is positioned for discard
3395	// we might have to discard samples "from" the next frame too,
3396	// if we're lapping a large block then a small at the start?
3397	f->discard_samples_deferred = n - right_end;
3398	f->current_loc_valid = TRUE1;
3399	f->first_decode = FALSE0;
3400	} else if (f->discard_samples_deferred) {
3401	left_start += f->discard_samples_deferred;
3402	*p_left = left_start;
3403	f->discard_samples_deferred = 0;
3404	} else if (f->previous_length == 0 && f->current_loc_valid) {
3405	// we're recovering from a seek... that means we're going to discard
3406	// the samples from this packet even though we know our position from
3407	// the last page header, so we need to update the position based on
3408	// the discarded samples here
3409	// but wait, the code below is going to add this in itself even
3410	// on a discard, so we don't need to do it here...
3411	}
3412
3413	// check if we have ogg information about the sample # for this packet
3414	if (f->last_seg_which == f->end_seg_with_known_loc) {
3415	// if we have a valid current loc, and this is final:
3416	if (f->current_loc_valid && (f->page_flag & PAGEFLAG_last_page4)) {
3417	uint32 current_end = f->known_loc_for_packet - (n-right_end);
3418	// then let's infer the size of the (probably) short final frame
3419	if (current_end < f->current_loc + right_end) {
3420	if (current_end < f->current_loc) {
3421	// negative truncation, that's impossible!
3422	*len = 0;
3423	} else {
3424	*len = current_end - f->current_loc;
3425	}
3426	*len += left_start;
3427	f->current_loc += *len;
3428	return TRUE1;
3429	}
3430	}
3431	// otherwise, just set our sample loc
3432	// guess that the ogg granule pos refers to the _middle_ of the
3433	// last frame?
3434	// set f->current_loc to the position of left_start
3435	f->current_loc = f->known_loc_for_packet - (n2-left_start);
3436	f->current_loc_valid = TRUE1;
3437	}
3438	if (f->current_loc_valid)
3439	f->current_loc += (right_start - left_start);
3440
3441	if (f->alloc.alloc_buffer)
3442	assert(f->alloc.alloc_buffer_length_in_bytes == f->temp_offset)((f->alloc.alloc_buffer_length_in_bytes == f->temp_offset ) ? (void)0 : _assert("f->alloc.alloc_buffer_length_in_bytes == f->temp_offset" , "src/siege/internal/stb/stb_vorbis.c", 3442));
3443	*len = right_end; // ignore samples after the window goes to 0
3444	return TRUE1;
3445	}
3446
3447	static int vorbis_decode_packet(vorb f, int len, int p_left, int p_right)
3448	{
3449	int mode, left_end, right_end;
3450	if (!vorbis_decode_initial(f, p_left, &left_end, p_right, &right_end, &mode)) return 0;
3451	return vorbis_decode_packet_rest(f, len, f->mode_config + mode, p_left, left_end, p_right, right_end, p_left);
3452	}
3453
3454	static int vorbis_finish_frame(stb_vorbis *f, int len, int left, int right)
3455	{
3456	int prev,i,j;
3457	// we use right&left (the start of the right- and left-window sin()-regions)
3458	// to determine how much to return, rather than inferring from the rules
3459	// (same result, clearer code); 'left' indicates where our sin() window
3460	// starts, therefore where the previous window's right edge starts, and
3461	// therefore where to start mixing from the previous buffer. 'right'
3462	// indicates where our sin() ending-window starts, therefore that's where
3463	// we start saving, and where our returned-data ends.
3464
3465	// mixin from previous window
3466	if (f->previous_length) {
3467	int i,j, n = f->previous_length;
3468	float *w = get_window(f, n);
3469	for (i=0; i < f->channels; ++i) {
3470	for (j=0; j < n; ++j)
3471	f->channel_buffers[i][left+j] =
3472	f->channel_buffers[i][left+j]*w[ j] +
3473	f->previous_window[i][ j]*w[n-1-j];
3474	}
3475	}
3476
3477	prev = f->previous_length;
3478
3479	// last half of this data becomes previous window
3480	f->previous_length = len - right;
3481
3482	// @OPTIMIZE: could avoid this copy by double-buffering the
3483	// output (flipping previous_window with channel_buffers), but
3484	// then previous_window would have to be 2x as large, and
3485	// channel_buffers couldn't be temp mem (although they're NOT
3486	// currently temp mem, they could be (unless we want to level
3487	// performance by spreading out the computation))
3488	for (i=0; i < f->channels; ++i)
3489	for (j=0; right+j < len; ++j)
3490	f->previous_window[i][j] = f->channel_buffers[i][right+j];
3491
3492	if (!prev)
3493	// there was no previous packet, so this data isn't valid...
3494	// this isn't entirely true, only the would-have-overlapped data
3495	// isn't valid, but this seems to be what the spec requires
3496	return 0;
3497
3498	// truncate a short frame
3499	if (len < right) right = len;
3500
3501	f->samples_output += right-left;
3502
3503	return right - left;
3504	}
3505
3506	static void vorbis_pump_first_frame(stb_vorbis *f)
3507	{
3508	int len, right, left;
3509	if (vorbis_decode_packet(f, &len, &left, &right))
3510	vorbis_finish_frame(f, len, left, right);
3511	}
3512
3513	#ifndef STB_VORBIS_NO_PUSHDATA_API
3514	static int is_whole_packet_present(stb_vorbis *f, int end_page)
3515	{
3516	// make sure that we have the packet available before continuing...
3517	// this requires a full ogg parse, but we know we can fetch from f->stream
3518
3519	// instead of coding this out explicitly, we could save the current read state,
3520	// read the next packet with get8() until end-of-packet, check f->eof, then
3521	// reset the state? but that would be slower, esp. since we'd have over 256 bytes
3522	// of state to restore (primarily the page segment table)
3523
3524	int s = f->next_seg, first = TRUE1;
3525	uint8 *p = f->stream;
3526
3527	if (s != -1) { // if we're not starting the packet with a 'continue on next page' flag
3528	for (; s < f->segment_count; ++s) {
3529	p += f->segments[s];
3530	if (f->segments[s] < 255) // stop at first short segment
3531	break;
3532	}
3533	// either this continues, or it ends it...
3534	if (end_page)
3535	if (s < f->segment_count-1) return error(f, VORBIS_invalid_stream);
3536	if (s == f->segment_count)
3537	s = -1; // set 'crosses page' flag
3538	if (p > f->stream_end) return error(f, VORBIS_need_more_data);
3539	first = FALSE0;
3540	}
3541	for (; s == -1;) {
3542	uint8 *q;
3543	int n;
3544
3545	// check that we have the page header ready
3546	if (p + 26 >= f->stream_end) return error(f, VORBIS_need_more_data);
3547	// validate the page
3548	if (memcmp(p, ogg_page_header, 4)) return error(f, VORBIS_invalid_stream);
3549	if (p[4] != 0) return error(f, VORBIS_invalid_stream);
3550	if (first) { // the first segment must NOT have 'continued_packet', later ones MUST
3551	if (f->previous_length)
3552	if ((p[5] & PAGEFLAG_continued_packet1)) return error(f, VORBIS_invalid_stream);
3553	// if no previous length, we're resynching, so we can come in on a continued-packet,
3554	// which we'll just drop
3555	} else {
3556	if (!(p[5] & PAGEFLAG_continued_packet1)) return error(f, VORBIS_invalid_stream);
3557	}
3558	n = p[26]; // segment counts
3559	q = p+27; // q points to segment table
3560	p = q + n; // advance past header
3561	// make sure we've read the segment table
3562	if (p > f->stream_end) return error(f, VORBIS_need_more_data);
3563	for (s=0; s < n; ++s) {
3564	p += q[s];
3565	if (q[s] < 255)
3566	break;
3567	}
3568	if (end_page)
3569	if (s < n-1) return error(f, VORBIS_invalid_stream);
3570	if (s == f->segment_count)
3571	s = -1; // set 'crosses page' flag
3572	if (p > f->stream_end) return error(f, VORBIS_need_more_data);
3573	first = FALSE0;
3574	}
3575	return TRUE1;
3576	}
3577	#endif // !STB_VORBIS_NO_PUSHDATA_API
3578
3579	static int start_decoder(vorb *f)
3580	{
3581	uint8 header[6], x,y;
3582	int len,i,j,k, max_submaps = 0;
3583	int longest_floorlist=0;
3584
3585	// first page, first packet
3586
3587	if (!start_page(f)) return FALSE0;
3588	// validate page flag
3589	if (!(f->page_flag & PAGEFLAG_first_page2)) return error(f, VORBIS_invalid_first_page);
3590	if (f->page_flag & PAGEFLAG_last_page4) return error(f, VORBIS_invalid_first_page);
3591	if (f->page_flag & PAGEFLAG_continued_packet1) return error(f, VORBIS_invalid_first_page);
3592	// check for expected packet length
3593	if (f->segment_count != 1) return error(f, VORBIS_invalid_first_page);
3594	if (f->segments[0] != 30) return error(f, VORBIS_invalid_first_page);
3595	// read packet
3596	// check packet header
3597	if (get8(f) != VORBIS_packet_id) return error(f, VORBIS_invalid_first_page);
3598	if (!getn(f, header, 6)) return error(f, VORBIS_unexpected_eof);
3599	if (!vorbis_validate(header)) return error(f, VORBIS_invalid_first_page);
3600	// vorbis_version
3601	if (get32(f) != 0) return error(f, VORBIS_invalid_first_page);
3602	f->channels = get8(f); if (!f->channels) return error(f, VORBIS_invalid_first_page);
3603	if (f->channels > STB_VORBIS_MAX_CHANNELS16) return error(f, VORBIS_too_many_channels);
3604	f->sample_rate = get32(f); if (!f->sample_rate) return error(f, VORBIS_invalid_first_page);
3605	get32(f); // bitrate_maximum
3606	get32(f); // bitrate_nominal
3607	get32(f); // bitrate_minimum
3608	x = get8(f);
3609	{ int log0,log1;
3610	log0 = x & 15;
3611	log1 = x >> 4;
3612	f->blocksize_0 = 1 << log0;
3613	f->blocksize_1 = 1 << log1;
3614	if (log0 < 6 \|\| log0 > 13) return error(f, VORBIS_invalid_setup);
3615	if (log1 < 6 \|\| log1 > 13) return error(f, VORBIS_invalid_setup);
3616	if (log0 > log1) return error(f, VORBIS_invalid_setup);
3617	}
3618
3619	// framing_flag
3620	x = get8(f);
3621	if (!(x & 1)) return error(f, VORBIS_invalid_first_page);
3622
3623	// second packet!
3624	if (!start_page(f)) return FALSE0;
3625
3626	if (!start_packet(f)) return FALSE0;
3627	do {
3628	len = next_segment(f);
3629	skip(f, len);
3630	f->bytes_in_seg = 0;
3631	} while (len);
3632
3633	// third packet!
3634	if (!start_packet(f)) return FALSE0;
3635
3636	#ifndef STB_VORBIS_NO_PUSHDATA_API
3637	if (IS_PUSH_MODE(f)((f)->push_mode)) {
3638	if (!is_whole_packet_present(f, TRUE1)) {
3639	// convert error in ogg header to write type
3640	if (f->error == VORBIS_invalid_stream)
3641	f->error = VORBIS_invalid_setup;
3642	return FALSE0;
3643	}
3644	}
3645	#endif
3646
3647	crc32_init(); // always init it, to avoid multithread race conditions
3648
3649	if (get8_packet(f) != VORBIS_packet_setup) return error(f, VORBIS_invalid_setup);
3650	for (i=0; i < 6; ++i) header[i] = get8_packet(f);
3651	if (!vorbis_validate(header)) return error(f, VORBIS_invalid_setup);
3652
3653	// codebooks
3654
3655	f->codebook_count = get_bits(f,8) + 1;
3656	f->codebooks = (Codebook ) setup_malloc(f, sizeof(f->codebooks) * f->codebook_count);
3657	if (f->codebooks == NULL((void*)0)) return error(f, VORBIS_outofmem);
3658	memset(f->codebooks, 0, sizeof(f->codebooks) f->codebook_count);
3659	for (i=0; i < f->codebook_count; ++i) {
3660	uint32 *values;
3661	int ordered, sorted_count;
3662	int total=0;
3663	uint8 *lengths;
3664	Codebook *c = f->codebooks+i;
3665	x = get_bits(f, 8); if (x != 0x42) return error(f, VORBIS_invalid_setup);
3666	x = get_bits(f, 8); if (x != 0x43) return error(f, VORBIS_invalid_setup);
3667	x = get_bits(f, 8); if (x != 0x56) return error(f, VORBIS_invalid_setup);
3668	x = get_bits(f, 8);
3669	c->dimensions = (get_bits(f, 8)<<8) + x;
3670	x = get_bits(f, 8);
3671	y = get_bits(f, 8);
3672	c->entries = (get_bits(f, 8)<<16) + (y<<8) + x;
3673	ordered = get_bits(f,1);
3674	c->sparse = ordered ? 0 : get_bits(f,1);
3675
3676	if (c->sparse)
3677	lengths = (uint8 *) setup_temp_malloc(f, c->entries);
3678	else
3679	lengths = c->codeword_lengths = (uint8 *) setup_malloc(f, c->entries);
3680
3681	if (!lengths) return error(f, VORBIS_outofmem);
3682
3683	if (ordered) {
3684	int current_entry = 0;
3685	int current_length = get_bits(f,5) + 1;
3686	while (current_entry < c->entries) {
3687	int limit = c->entries - current_entry;
3688	int n = get_bits(f, ilog(limit));
3689	if (current_entry + n > (int) c->entries) { return error(f, VORBIS_invalid_setup); }
3690	memset(lengths + current_entry, current_length, n);
3691	current_entry += n;
3692	++current_length;
3693	}
3694	} else {
3695	for (j=0; j < c->entries; ++j) {
3696	int present = c->sparse ? get_bits(f,1) : 1;
3697	if (present) {
3698	lengths[j] = get_bits(f, 5) + 1;
3699	++total;
3700	} else {
3701	lengths[j] = NO_CODE255;
3702	}
3703	}
3704	}
3705
3706	if (c->sparse && total >= c->entries >> 2) {
3707	// convert sparse items to non-sparse!
3708	if (c->entries > (int) f->setup_temp_memory_required)
3709	f->setup_temp_memory_required = c->entries;
3710
3711	c->codeword_lengths = (uint8 *) setup_malloc(f, c->entries);
3712	memcpy(c->codeword_lengths, lengths, c->entries);
3713	setup_temp_free(f, lengths, c->entries); // note this is only safe if there have been no intervening temp mallocs!
3714	lengths = c->codeword_lengths;
3715	c->sparse = 0;
3716	}
3717
3718	// compute the size of the sorted tables
3719	if (c->sparse) {
3720	sorted_count = total;
3721	//assert(total != 0);
3722	} else {
3723	sorted_count = 0;
3724	#ifndef STB_VORBIS_NO_HUFFMAN_BINARY_SEARCH
3725	for (j=0; j < c->entries; ++j)
3726	if (lengths[j] > STB_VORBIS_FAST_HUFFMAN_LENGTH10 && lengths[j] != NO_CODE255)
3727	++sorted_count;
3728	#endif
3729	}
3730
3731	c->sorted_entries = sorted_count;
3732	values = NULL((void*)0);
3733
3734	if (!c->sparse) {
3735	c->codewords = (uint32 ) setup_malloc(f, sizeof(c->codewords[0]) c->entries);
3736	if (!c->codewords) return error(f, VORBIS_outofmem);
3737	} else {
3738	unsigned int size;
3739	if (c->sorted_entries) {
3740	c->codeword_lengths = (uint8 *) setup_malloc(f, c->sorted_entries);
3741	if (!c->codeword_lengths) return error(f, VORBIS_outofmem);
3742	c->codewords = (uint32 ) setup_temp_malloc(f, sizeof(c->codewords) * c->sorted_entries);
3743	if (!c->codewords) return error(f, VORBIS_outofmem);
3744	values = (uint32 ) setup_temp_malloc(f, sizeof(values) * c->sorted_entries);
3745	if (!values) return error(f, VORBIS_outofmem);
3746	}
3747	size = c->entries + (sizeof(c->codewords) + sizeof(values)) * c->sorted_entries;
3748	if (size > f->setup_temp_memory_required)
3749	f->setup_temp_memory_required = size;
3750	}
3751
3752	if (!compute_codewords(c, lengths, c->entries, values)) {
3753	if (c->sparse) setup_temp_free(f, values, 0);
3754	return error(f, VORBIS_invalid_setup);
3755	}
3756
3757	if (c->sorted_entries) {
3758	// allocate an extra slot for sentinels
3759	c->sorted_codewords = (uint32 ) setup_malloc(f, sizeof(c->sorted_codewords) * (c->sorted_entries+1));
3760	// allocate an extra slot at the front so that c->sorted_values[-1] is defined
3761	// so that we can catch that case without an extra if
3762	c->sorted_values = ( int ) setup_malloc(f, sizeof(c->sorted_values ) * (c->sorted_entries+1));
3763	if (c->sorted_values) { ++c->sorted_values; c->sorted_values[-1] = -1; }
3764	compute_sorted_huffman(c, lengths, values);
3765	}
3766
3767	if (c->sparse) {
3768	setup_temp_free(f, values, sizeof(values)c->sorted_entries);
3769	setup_temp_free(f, c->codewords, sizeof(c->codewords)c->sorted_entries);
3770	setup_temp_free(f, lengths, c->entries);
3771	c->codewords = NULL((void*)0);
3772	}
3773
3774	compute_accelerated_huffman(c);
3775
3776	c->lookup_type = get_bits(f, 4);
3777	if (c->lookup_type > 2) return error(f, VORBIS_invalid_setup);
3778	if (c->lookup_type > 0) {
3779	uint16 *mults;
3780	c->minimum_value = float32_unpack(get_bits(f, 32));
3781	c->delta_value = float32_unpack(get_bits(f, 32));
3782	c->value_bits = get_bits(f, 4)+1;
3783	c->sequence_p = get_bits(f,1);
3784	if (c->lookup_type == 1) {
3785	c->lookup_values = lookup1_values(c->entries, c->dimensions);
3786	} else {
3787	c->lookup_values = c->entries * c->dimensions;
3788	}
3789	mults = (uint16 ) setup_temp_malloc(f, sizeof(mults[0]) c->lookup_values);
3790	if (mults == NULL((void*)0)) return error(f, VORBIS_outofmem);
3791	for (j=0; j < (int) c->lookup_values; ++j) {
3792	int q = get_bits(f, c->value_bits);
3793	if (q == EOP(-1)) { setup_temp_free(f,mults,sizeof(mults[0])*c->lookup_values); return error(f, VORBIS_invalid_setup); }
3794	mults[j] = q;
3795	}
3796
3797	#ifndef STB_VORBIS_DIVIDES_IN_CODEBOOK
3798	if (c->lookup_type == 1) {
3799	int len, sparse = c->sparse;
3800	// pre-expand the lookup1-style multiplicands, to avoid a divide in the inner loop
3801	if (sparse) {
3802	if (c->sorted_entries == 0) goto skip;
3803	c->multiplicands = (codetype ) setup_malloc(f, sizeof(c->multiplicands[0]) c->sorted_entries * c->dimensions);
3804	} else
3805	c->multiplicands = (codetype ) setup_malloc(f, sizeof(c->multiplicands[0]) c->entries * c->dimensions);
3806	if (c->multiplicands == NULL((void)0)) { setup_temp_free(f,mults,sizeof(mults[0])c->lookup_values); return error(f, VORBIS_outofmem); }
3807	len = sparse ? c->sorted_entries : c->entries;
3808	for (j=0; j < len; ++j) {
3809	int z = sparse ? c->sorted_values[j] : j, div=1;
3810	for (k=0; k < c->dimensions; ++k) {
3811	int off = (z / div) % c->lookup_values;
3812	c->multiplicands[j*c->dimensions + k] =
3813	#ifndef STB_VORBIS_CODEBOOK_FLOATS
3814	mults[off];
3815	#else
3816	mults[off]*c->delta_value + c->minimum_value;
3817	// in this case (and this case only) we could pre-expand c->sequence_p,
3818	// and throw away the decode logic for it; have to ALSO do
3819	// it in the case below, but it can only be done if
3820	// STB_VORBIS_CODEBOOK_FLOATS
3821	// !STB_VORBIS_DIVIDES_IN_CODEBOOK
3822	#endif
3823	div *= c->lookup_values;
3824	}
3825	}
3826	setup_temp_free(f, mults,sizeof(mults[0])*c->lookup_values);
3827	c->lookup_type = 2;
3828	}
3829	else
3830	#endif
3831	{
3832	c->multiplicands = (codetype ) setup_malloc(f, sizeof(c->multiplicands[0]) c->lookup_values);
3833	#ifndef STB_VORBIS_CODEBOOK_FLOATS
3834	memcpy(c->multiplicands, mults, sizeof(c->multiplicands[0]) * c->lookup_values);
3835	#else
3836	for (j=0; j < (int) c->lookup_values; ++j)
3837	c->multiplicands[j] = mults[j] * c->delta_value + c->minimum_value;
3838	setup_temp_free(f, mults,sizeof(mults[0])*c->lookup_values);
3839	#endif
3840	}
3841	skip:;
3842
3843	#ifdef STB_VORBIS_CODEBOOK_FLOATS
3844	if (c->lookup_type == 2 && c->sequence_p) {
3845	for (j=1; j < (int) c->lookup_values; ++j)
3846	c->multiplicands[j] = c->multiplicands[j-1];
3847	c->sequence_p = 0;
3848	}
3849	#endif
3850	}
3851	}
3852
3853	// time domain transfers (notused)
3854
3855	x = get_bits(f, 6) + 1;
3856	for (i=0; i < x; ++i) {
3857	uint32 z = get_bits(f, 16);
3858	if (z != 0) return error(f, VORBIS_invalid_setup);
3859	}
3860
3861	// Floors
3862	f->floor_count = get_bits(f, 6)+1;
3863	f->floor_config = (Floor ) setup_malloc(f, f->floor_count sizeof(*f->floor_config));
3864	for (i=0; i < f->floor_count; ++i) {
3865	f->floor_types[i] = get_bits(f, 16);
3866	if (f->floor_types[i] > 1) return error(f, VORBIS_invalid_setup);
3867	if (f->floor_types[i] == 0) {
3868	Floor0 *g = &f->floor_config[i].floor0;
3869	g->order = get_bits(f,8);
3870	g->rate = get_bits(f,16);
3871	g->bark_map_size = get_bits(f,16);
3872	g->amplitude_bits = get_bits(f,6);
3873	g->amplitude_offset = get_bits(f,8);
3874	g->number_of_books = get_bits(f,4) + 1;
3875	for (j=0; j < g->number_of_books; ++j)
3876	g->book_list[j] = get_bits(f,8);
3877	return error(f, VORBIS_feature_not_supported);
3878	} else {
3879	Point p[31*8+2];
3880	Floor1 *g = &f->floor_config[i].floor1;
3881	int max_class = -1;
3882	g->partitions = get_bits(f, 5);
3883	for (j=0; j < g->partitions; ++j) {
3884	g->partition_class_list[j] = get_bits(f, 4);
3885	if (g->partition_class_list[j] > max_class)
3886	max_class = g->partition_class_list[j];
3887	}
3888	for (j=0; j <= max_class; ++j) {
3889	g->class_dimensions[j] = get_bits(f, 3)+1;
3890	g->class_subclasses[j] = get_bits(f, 2);
3891	if (g->class_subclasses[j]) {
3892	g->class_masterbooks[j] = get_bits(f, 8);
3893	if (g->class_masterbooks[j] >= f->codebook_count) return error(f, VORBIS_invalid_setup);
3894	}
3895	for (k=0; k < 1 << g->class_subclasses[j]; ++k) {
3896	g->subclass_books[j][k] = get_bits(f,8)-1;
3897	if (g->subclass_books[j][k] >= f->codebook_count) return error(f, VORBIS_invalid_setup);
3898	}
3899	}
3900	g->floor1_multiplier = get_bits(f,2)+1;
3901	g->rangebits = get_bits(f,4);
3902	g->Xlist[0] = 0;
3903	g->Xlist[1] = 1 << g->rangebits;
3904	g->values = 2;
3905	for (j=0; j < g->partitions; ++j) {
3906	int c = g->partition_class_list[j];
3907	for (k=0; k < g->class_dimensions[c]; ++k) {
3908	g->Xlist[g->values] = get_bits(f, g->rangebits);
3909	++g->values;
3910	}
3911	}
3912	// precompute the sorting
3913	for (j=0; j < g->values; ++j) {
3914	p[j].x = g->Xlist[j];
3915	p[j].y = j;
3916	}
3917	qsort(p, g->values, sizeof(p[0]), point_compare);
3918	for (j=0; j < g->values; ++j)
3919	g->sorted_order[j] = (uint8) p[j].y;
3920	// precompute the neighbors
3921	for (j=2; j < g->values; ++j) {
3922	int low,hi;
3923	neighbors(g->Xlist, j, &low,&hi);
3924	g->neighbors[j][0] = low;
3925	g->neighbors[j][1] = hi;
3926	}
3927
3928	if (g->values > longest_floorlist)
3929	longest_floorlist = g->values;
3930	}
3931	}
3932
3933	// Residue
3934	f->residue_count = get_bits(f, 6)+1;
3935	f->residue_config = (Residue ) setup_malloc(f, f->residue_count sizeof(*f->residue_config));
3936	for (i=0; i < f->residue_count; ++i) {
3937	uint8 residue_cascade[64];
3938	Residue *r = f->residue_config+i;
3939	f->residue_types[i] = get_bits(f, 16);
3940	if (f->residue_types[i] > 2) return error(f, VORBIS_invalid_setup);
3941	r->begin = get_bits(f, 24);
3942	r->end = get_bits(f, 24);
3943	r->part_size = get_bits(f,24)+1;
3944	r->classifications = get_bits(f,6)+1;
3945	r->classbook = get_bits(f,8);
3946	for (j=0; j < r->classifications; ++j) {
3947	uint8 high_bits=0;
3948	uint8 low_bits=get_bits(f,3);
3949	if (get_bits(f,1))
3950	high_bits = get_bits(f,5);
3951	residue_cascade[j] = high_bits*8 + low_bits;
3952	}
3953	r->residue_books = (short ()[8]) setup_malloc(f, sizeof(r->residue_books[0]) r->classifications);
3954	for (j=0; j < r->classifications; ++j) {
3955	for (k=0; k < 8; ++k) {
3956	if (residue_cascade[j] & (1 << k)) {
3957	r->residue_books[j][k] = get_bits(f, 8);
3958	if (r->residue_books[j][k] >= f->codebook_count) return error(f, VORBIS_invalid_setup);
3959	} else {
3960	r->residue_books[j][k] = -1;
3961	}
3962	}
3963	}
3964	// precompute the classifications[] array to avoid inner-loop mod/divide
3965	// call it 'classdata' since we already have r->classifications
3966	r->classdata = (uint8 *) setup_malloc(f, sizeof(r->classdata) * f->codebooks[r->classbook].entries);
3967	if (!r->classdata) return error(f, VORBIS_outofmem);
3968	memset(r->classdata, 0, sizeof(r->classdata) f->codebooks[r->classbook].entries);
3969	for (j=0; j < f->codebooks[r->classbook].entries; ++j) {
3970	int classwords = f->codebooks[r->classbook].dimensions;
3971	int temp = j;
3972	r->classdata[j] = (uint8 ) setup_malloc(f, sizeof(r->classdata[j][0]) classwords);
3973	for (k=classwords-1; k >= 0; --k) {
3974	r->classdata[j][k] = temp % r->classifications;
3975	temp /= r->classifications;
3976	}
3977	}
3978	}
3979
3980	f->mapping_count = get_bits(f,6)+1;
3981	f->mapping = (Mapping ) setup_malloc(f, f->mapping_count sizeof(*f->mapping));
3982	for (i=0; i < f->mapping_count; ++i) {
3983	Mapping *m = f->mapping + i;
3984	int mapping_type = get_bits(f,16);
3985	if (mapping_type != 0) return error(f, VORBIS_invalid_setup);
3986	m->chan = (MappingChannel ) setup_malloc(f, f->channels sizeof(*m->chan));
3987	if (get_bits(f,1))
3988	m->submaps = get_bits(f,4);
3989	else
3990	m->submaps = 1;
3991	if (m->submaps > max_submaps)
3992	max_submaps = m->submaps;
3993	if (get_bits(f,1)) {
3994	m->coupling_steps = get_bits(f,8)+1;
3995	for (k=0; k < m->coupling_steps; ++k) {
3996	m->chan[k].magnitude = get_bits(f, ilog(f->channels)-1);
3997	m->chan[k].angle = get_bits(f, ilog(f->channels)-1);
3998	if (m->chan[k].magnitude >= f->channels) return error(f, VORBIS_invalid_setup);
3999	if (m->chan[k].angle >= f->channels) return error(f, VORBIS_invalid_setup);
4000	if (m->chan[k].magnitude == m->chan[k].angle) return error(f, VORBIS_invalid_setup);
4001	}
4002	} else
4003	m->coupling_steps = 0;
4004
4005	// reserved field
4006	if (get_bits(f,2)) return error(f, VORBIS_invalid_setup);
4007	if (m->submaps > 1) {
4008	for (j=0; j < f->channels; ++j) {
4009	m->chan[j].mux = get_bits(f, 4);
4010	if (m->chan[j].mux >= m->submaps) return error(f, VORBIS_invalid_setup);
4011	}
4012	} else
4013	// @SPECIFICATION: this case is missing from the spec
4014	for (j=0; j < f->channels; ++j)
4015	m->chan[j].mux = 0;
4016
4017	for (j=0; j < m->submaps; ++j) {
4018	get_bits(f,8); // discard
4019	m->submap_floor[j] = get_bits(f,8);
4020	m->submap_residue[j] = get_bits(f,8);
4021	if (m->submap_floor[j] >= f->floor_count) return error(f, VORBIS_invalid_setup);
4022	if (m->submap_residue[j] >= f->residue_count) return error(f, VORBIS_invalid_setup);
4023	}
4024	}
4025
4026	// Modes
4027	f->mode_count = get_bits(f, 6)+1;
4028	for (i=0; i < f->mode_count; ++i) {
4029	Mode *m = f->mode_config+i;
4030	m->blockflag = get_bits(f,1);
4031	m->windowtype = get_bits(f,16);
4032	m->transformtype = get_bits(f,16);
4033	m->mapping = get_bits(f,8);
4034	if (m->windowtype != 0) return error(f, VORBIS_invalid_setup);
4035	if (m->transformtype != 0) return error(f, VORBIS_invalid_setup);
4036	if (m->mapping >= f->mapping_count) return error(f, VORBIS_invalid_setup);
4037	}
4038
4039	flush_packet(f);
4040
4041	f->previous_length = 0;
4042
4043	for (i=0; i < f->channels; ++i) {
4044	f->channel_buffers[i] = (float ) setup_malloc(f, sizeof(float) f->blocksize_1);
4045	f->previous_window[i] = (float ) setup_malloc(f, sizeof(float) f->blocksize_1/2);
4046	f->finalY[i] = (int16 ) setup_malloc(f, sizeof(int16) longest_floorlist);
4047	#ifdef STB_VORBIS_NO_DEFER_FLOOR
4048	f->floor_buffers[i] = (float ) setup_malloc(f, sizeof(float) f->blocksize_1/2);
4049	#endif
4050	}
4051
4052	if (!init_blocksize(f, 0, f->blocksize_0)) return FALSE0;
4053	if (!init_blocksize(f, 1, f->blocksize_1)) return FALSE0;
4054	f->blocksize[0] = f->blocksize_0;
4055	f->blocksize[1] = f->blocksize_1;
4056
4057	#ifdef STB_VORBIS_DIVIDE_TABLE
4058	if (integer_divide_table[1][1]==0)
4059	for (i=0; i < DIVTAB_NUMER; ++i)
4060	for (j=1; j < DIVTAB_DENOM; ++j)
4061	integer_divide_table[i][j] = i / j;
4062	#endif
4063
4064	// compute how much temporary memory is needed
4065
4066	// 1.
4067	{
4068	uint32 imdct_mem = (f->blocksize_1 * sizeof(float) >> 1);
4069	uint32 classify_mem;
4070	int i,max_part_read=0;
4071	for (i=0; i < f->residue_count; ++i) {
4072	Residue *r = f->residue_config + i;
4073	int n_read = r->end - r->begin;
4074	int part_read = n_read / r->part_size;
4075	if (part_read > max_part_read)
4076	max_part_read = part_read;
4077	}
4078	#ifndef STB_VORBIS_DIVIDES_IN_RESIDUE
4079	classify_mem = f->channels * (sizeof(void) + max_part_read sizeof(uint8 *));
4080	#else
4081	classify_mem = f->channels * (sizeof(void) + max_part_read sizeof(int *));
4082	#endif
4083
4084	f->temp_memory_required = classify_mem;
4085	if (imdct_mem > f->temp_memory_required)
4086	f->temp_memory_required = imdct_mem;
4087	}
4088
4089	f->first_decode = TRUE1;
4090
4091	if (f->alloc.alloc_buffer) {
4092	assert(f->temp_offset == f->alloc.alloc_buffer_length_in_bytes)((f->temp_offset == f->alloc.alloc_buffer_length_in_bytes ) ? (void)0 : _assert("f->temp_offset == f->alloc.alloc_buffer_length_in_bytes" , "src/siege/internal/stb/stb_vorbis.c", 4092));
4093	// check if there's enough temp memory so we don't error later
4094	if (f->setup_offset + sizeof(*f) + f->temp_memory_required > (unsigned) f->temp_offset)
4095	return error(f, VORBIS_outofmem);
4096	}
4097
4098	f->first_audio_page_offset = stb_vorbis_get_file_offset(f);
4099
4100	return TRUE1;
4101	}
4102
4103	static void vorbis_deinit(stb_vorbis *p)
4104	{
4105	int i,j;
4106	for (i=0; i < p->residue_count; ++i) {
4107	Residue *r = p->residue_config+i;
4108	if (r->classdata) {
4109	for (j=0; j < p->codebooks[r->classbook].entries; ++j)
4110	setup_free(p, r->classdata[j]);
4111	setup_free(p, r->classdata);
4112	}
4113	setup_free(p, r->residue_books);
4114	}
4115
4116	if (p->codebooks) {
4117	for (i=0; i < p->codebook_count; ++i) {
4118	Codebook *c = p->codebooks + i;
4119	setup_free(p, c->codeword_lengths);
4120	setup_free(p, c->multiplicands);
4121	setup_free(p, c->codewords);
4122	setup_free(p, c->sorted_codewords);
4123	// c->sorted_values[-1] is the first entry in the array
4124	setup_free(p, c->sorted_values ? c->sorted_values-1 : NULL((void*)0));
4125	}
4126	setup_free(p, p->codebooks);
4127	}
4128	setup_free(p, p->floor_config);
4129	setup_free(p, p->residue_config);
4130	for (i=0; i < p->mapping_count; ++i)
4131	setup_free(p, p->mapping[i].chan);
4132	setup_free(p, p->mapping);
4133	for (i=0; i < p->channels; ++i) {
4134	setup_free(p, p->channel_buffers[i]);
4135	setup_free(p, p->previous_window[i]);
4136	#ifdef STB_VORBIS_NO_DEFER_FLOOR
4137	setup_free(p, p->floor_buffers[i]);
4138	#endif
4139	setup_free(p, p->finalY[i]);
4140	}
4141	for (i=0; i < 2; ++i) {
4142	setup_free(p, p->A[i]);
4143	setup_free(p, p->B[i]);
4144	setup_free(p, p->C(2 \| 4 \| 1)[i]);
4145	setup_free(p, p->window[i]);
4146	}
4147	#ifndef STB_VORBIS_NO_STDIO
4148	if (p->close_on_free) fclose(p->f);
4149	#endif
4150	}
4151
4152	void stb_vorbis_close(stb_vorbis *p)
4153	{
4154	if (p == NULL((void*)0)) return;
4155	vorbis_deinit(p);
4156	setup_free(p,p);
4157	}
4158
4159	static void vorbis_init(stb_vorbis p, stb_vorbis_alloc z)
4160	{
4161	memset(p, 0, sizeof(*p)); // NULL out all malloc'd pointers to start
4162	if (z) {
4163	p->alloc = *z;
4164	p->alloc.alloc_buffer_length_in_bytes = (p->alloc.alloc_buffer_length_in_bytes+3) & ~3;
4165	p->temp_offset = p->alloc.alloc_buffer_length_in_bytes;
4166	}
4167	p->eof = 0;
4168	p->error = VORBIS__no_error;
4169	p->stream = NULL((void*)0);
4170	p->codebooks = NULL((void*)0);
4171	p->page_crc_tests = -1;
4172	#ifndef STB_VORBIS_NO_STDIO
4173	p->close_on_free = FALSE0;
4174	p->f = NULL((void*)0);
4175	#endif
4176	}
4177
4178	int stb_vorbis_get_sample_offset(stb_vorbis *f)
4179	{
4180	if (f->current_loc_valid)
4181	return f->current_loc;
4182	else
4183	return -1;
4184	}
4185
4186	stb_vorbis_info stb_vorbis_get_info(stb_vorbis *f)
4187	{
4188	stb_vorbis_info d;
4189	d.channels = f->channels;
4190	d.sample_rate = f->sample_rate;
4191	d.setup_memory_required = f->setup_memory_required;
4192	d.setup_temp_memory_required = f->setup_temp_memory_required;
4193	d.temp_memory_required = f->temp_memory_required;
4194	d.max_frame_size = f->blocksize_1 >> 1;
4195	return d;
4196	}
4197
4198	int stb_vorbis_get_error(stb_vorbis *f)
4199	{
4200	int e = f->error;
4201	f->error = VORBIS__no_error;
4202	return e;
4203	}
4204
4205	static stb_vorbis * vorbis_alloc(stb_vorbis *f)
4206	{
4207	stb_vorbis p = (stb_vorbis ) setup_malloc(f, sizeof(*p));
4208	return p;
4209	}
4210
4211	#ifndef STB_VORBIS_NO_PUSHDATA_API
4212
4213	void stb_vorbis_flush_pushdata(stb_vorbis *f)
4214	{
4215	f->previous_length = 0;
4216	f->page_crc_tests = 0;
4217	f->discard_samples_deferred = 0;
4218	f->current_loc_valid = FALSE0;
4219	f->first_decode = FALSE0;
4220	f->samples_output = 0;
4221	f->channel_buffer_start = 0;
4222	f->channel_buffer_end = 0;
4223	}
4224
4225	static int vorbis_search_for_page_pushdata(vorb f, uint8 data, int data_len)
4226	{
4227	int i,n;
4228	for (i=0; i < f->page_crc_tests; ++i)
4229	f->scan[i].bytes_done = 0;
4230
4231	// if we have room for more scans, search for them first, because
4232	// they may cause us to stop early if their header is incomplete
4233	if (f->page_crc_tests < STB_VORBIS_PUSHDATA_CRC_COUNT4) {
4234	if (data_len < 4) return 0;
4235	data_len -= 3; // need to look for 4-byte sequence, so don't miss
4236	// one that straddles a boundary
4237	for (i=0; i < data_len; ++i) {
4238	if (data[i] == 0x4f) {
4239	if (0==memcmp(data+i, ogg_page_header, 4)) {
4240	int j,len;
4241	uint32 crc;
4242	// make sure we have the whole page header
4243	if (i+26 >= data_len \|\| i+27+data[i+26] >= data_len) {
4244	// only read up to this page start, so hopefully we'll
4245	// have the whole page header start next time
4246	data_len = i;
4247	break;
4248	}
4249	// ok, we have it all; compute the length of the page
4250	len = 27 + data[i+26];
4251	for (j=0; j < data[i+26]; ++j)
4252	len += data[i+27+j];
4253	// scan everything up to the embedded crc (which we must 0)
4254	crc = 0;
4255	for (j=0; j < 22; ++j)
4256	crc = crc32_update(crc, data[i+j]);
4257	// now process 4 0-bytes
4258	for ( ; j < 26; ++j)
4259	crc = crc32_update(crc, 0);
4260	// len is the total number of bytes we need to scan
4261	n = f->page_crc_tests++;
4262	f->scan[n].bytes_left = len-j;
4263	f->scan[n].crc_so_far = crc;
4264	f->scan[n].goal_crc = data[i+22] + (data[i+23] << 8) + (data[i+24]<<16) + (data[i+25]<<24);
4265	// if the last frame on a page is continued to the next, then
4266	// we can't recover the sample_loc immediately
4267	if (data[i+27+data[i+26]-1] == 255)
4268	f->scan[n].sample_loc = ~0;
4269	else
4270	f->scan[n].sample_loc = data[i+6] + (data[i+7] << 8) + (data[i+ 8]<<16) + (data[i+ 9]<<24);
4271	f->scan[n].bytes_done = i+j;
4272	if (f->page_crc_tests == STB_VORBIS_PUSHDATA_CRC_COUNT4)
4273	break;
4274	// keep going if we still have room for more
4275	}
4276	}
4277	}
4278	}
4279
4280	for (i=0; i < f->page_crc_tests;) {
4281	uint32 crc;
4282	int j;
4283	int n = f->scan[i].bytes_done;
4284	int m = f->scan[i].bytes_left;
4285	if (m > data_len - n) m = data_len - n;
4286	// m is the bytes to scan in the current chunk
4287	crc = f->scan[i].crc_so_far;
4288	for (j=0; j < m; ++j)
4289	crc = crc32_update(crc, data[n+j]);
4290	f->scan[i].bytes_left -= m;
4291	f->scan[i].crc_so_far = crc;
4292	if (f->scan[i].bytes_left == 0) {
4293	// does it match?
4294	if (f->scan[i].crc_so_far == f->scan[i].goal_crc) {
4295	// Houston, we have page
4296	data_len = n+m; // consumption amount is wherever that scan ended
4297	f->page_crc_tests = -1; // drop out of page scan mode
4298	f->previous_length = 0; // decode-but-don't-output one frame
4299	f->next_seg = -1; // start a new page
4300	f->current_loc = f->scan[i].sample_loc; // set the current sample location
4301	// to the amount we'd have decoded had we decoded this page
4302	f->current_loc_valid = f->current_loc != ~0;
4303	return data_len;
4304	}
4305	// delete entry
4306	f->scan[i] = f->scan[--f->page_crc_tests];
4307	} else {
4308	++i;
4309	}
4310	}
4311
4312	return data_len;
4313	}
4314
4315	// return value: number of bytes we used
4316	int stb_vorbis_decode_frame_pushdata(
4317	stb_vorbis *f, // the file we're decoding
4318	uint8 *data, int data_len, // the memory available for decoding
4319	int channels, // place to write number of float buffers
4320	float *output, // place to write float array of float * buffers
4321	int *samples // place to write number of output samples
4322	)
4323	{
4324	int i;
4325	int len,right,left;
4326
4327	if (!IS_PUSH_MODE(f)((f)->push_mode)) return error(f, VORBIS_invalid_api_mixing);
4328
4329	if (f->page_crc_tests >= 0) {
4330	*samples = 0;
4331	return vorbis_search_for_page_pushdata(f, data, data_len);
4332	}
4333
4334	f->stream = data;
4335	f->stream_end = data + data_len;
4336	f->error = VORBIS__no_error;
4337
4338	// check that we have the entire packet in memory
4339	if (!is_whole_packet_present(f, FALSE0)) {
4340	*samples = 0;
4341	return 0;
4342	}
4343
4344	if (!vorbis_decode_packet(f, &len, &left, &right)) {
4345	// save the actual error we encountered
4346	enum STBVorbisError error = f->error;
4347	if (error == VORBIS_bad_packet_type) {
4348	// flush and resynch
4349	f->error = VORBIS__no_error;
4350	while (get8_packet(f) != EOP(-1))
4351	if (f->eof) break;
4352	*samples = 0;
4353	return f->stream - data;
4354	}
4355	if (error == VORBIS_continued_packet_flag_invalid) {
4356	if (f->previous_length == 0) {
4357	// we may be resynching, in which case it's ok to hit one
4358	// of these; just discard the packet
4359	f->error = VORBIS__no_error;
4360	while (get8_packet(f) != EOP(-1))
4361	if (f->eof) break;
4362	*samples = 0;
4363	return f->stream - data;
4364	}
4365	}
4366	// if we get an error while parsing, what to do?
4367	// well, it DEFINITELY won't work to continue from where we are!
4368	stb_vorbis_flush_pushdata(f);
4369	// restore the error that actually made us bail
4370	f->error = error;
4371	*samples = 0;
4372	return 1;
4373	}
4374
4375	// success!
4376	len = vorbis_finish_frame(f, len, left, right);
4377	for (i=0; i < f->channels; ++i)
4378	f->outputs[i] = f->channel_buffers[i] + left;
4379
4380	if (channels) *channels = f->channels;
4381	*samples = len;
4382	*output = f->outputs;
4383	return f->stream - data;
4384	}
4385
4386	stb_vorbis *stb_vorbis_open_pushdata(
4387	unsigned char *data, int data_len, // the memory available for decoding
4388	int *data_used, // only defined if result is not NULL
4389	int error, stb_vorbis_alloc alloc)
4390	{
4391	stb_vorbis *f, p;
4392	vorbis_init(&p, alloc);
4393	p.stream = data;
4394	p.stream_end = data + data_len;
4395	p.push_mode = TRUE1;
4396	if (!start_decoder(&p)) {
4397	if (p.eof)
4398	*error = VORBIS_need_more_data;
4399	else
4400	*error = p.error;
4401	return NULL((void*)0);
4402	}
4403	f = vorbis_alloc(&p);
4404	if (f) {
4405	*f = p;
4406	*data_used = f->stream - data;
4407	*error = 0;
4408	return f;
4409	} else {
4410	vorbis_deinit(&p);
4411	return NULL((void*)0);
4412	}
4413	}
4414	#endif // STB_VORBIS_NO_PUSHDATA_API
4415
4416	unsigned int stb_vorbis_get_file_offset(stb_vorbis *f)
4417	{
4418	#ifndef STB_VORBIS_NO_PUSHDATA_API
4419	if (f->push_mode) return 0;
4420	#endif
4421	if (USE_MEMORY(f)((f)->stream)) return f->stream - f->stream_start;
4422	#ifndef STB_VORBIS_NO_STDIO
4423	return ftell(f->f) - f->f_start;
4424	#endif
4425	}
4426
4427	#ifndef STB_VORBIS_NO_PULLDATA_API
4428	//
4429	// DATA-PULLING API
4430	//
4431
4432	static uint32 vorbis_find_page(stb_vorbis f, uint32 end, uint32 *last)
4433	{
4434	for(;;) {
4435	int n;
4436	if (f->eof) return 0;
4437	n = get8(f);
4438	if (n == 0x4f) { // page header
4439	unsigned int retry_loc = stb_vorbis_get_file_offset(f);
4440	int i;
4441	// check if we're off the end of a file_section stream
4442	if (retry_loc - 25 > f->stream_len)
4443	return 0;
4444	// check the rest of the header
4445	for (i=1; i < 4; ++i)
4446	if (get8(f) != ogg_page_header[i])
4447	break;
4448	if (f->eof) return 0;
4449	if (i == 4) {
4450	uint8 header[27];
4451	uint32 i, crc, goal, len;
4452	for (i=0; i < 4; ++i)
4453	header[i] = ogg_page_header[i];
4454	for (; i < 27; ++i)
4455	header[i] = get8(f);
4456	if (f->eof) return 0;
4457	if (header[4] != 0) goto invalid;
4458	goal = header[22] + (header[23] << 8) + (header[24]<<16) + (header[25]<<24);
4459	for (i=22; i < 26; ++i)
4460	header[i] = 0;
4461	crc = 0;
4462	for (i=0; i < 27; ++i)
4463	crc = crc32_update(crc, header[i]);
4464	len = 0;
4465	for (i=0; i < header[26]; ++i) {
4466	int s = get8(f);
4467	crc = crc32_update(crc, s);
4468	len += s;
4469	}
4470	if (len && f->eof) return 0;
4471	for (i=0; i < len; ++i)
4472	crc = crc32_update(crc, get8(f));
4473	// finished parsing probable page
4474	if (crc == goal) {
4475	// we could now check that it's either got the last
4476	// page flag set, OR it's followed by the capture
4477	// pattern, but I guess TECHNICALLY you could have
4478	// a file with garbage between each ogg page and recover
4479	// from it automatically? So even though that paranoia
4480	// might decrease the chance of an invalid decode by
4481	// another 2^32, not worth it since it would hose those
4482	// invalid-but-useful files?
4483	if (end)
4484	*end = stb_vorbis_get_file_offset(f);
4485	if (last)
4486	{
4487	if (header[5] & 0x04)
4488	*last = 1;
4489	else
4490	*last = 0;
4491	}
4492	set_file_offset(f, retry_loc-1);
4493	return 1;
4494	}
4495	}
4496	invalid:
4497	// not a valid page, so rewind and look for next one
4498	set_file_offset(f, retry_loc);
4499	}
4500	}
4501	}
4502
4503	// seek is implemented with 'interpolation search'--this is like
4504	// binary search, but we use the data values to estimate the likely
4505	// location of the data item (plus a bit of a bias so when the
4506	// estimation is wrong we don't waste overly much time)
4507
// sentinel meaning "this sample position could not be determined"
#define SAMPLE_unknown              0xffffffff
4509
4510
4511	// ogg vorbis, in its insane infinite wisdom, only provides
4512	// information about the sample at the END of the page.
4513	// therefore we COULD have the data we need in the current
4514	// page, and not know it. we could just use the end location
4515	// as our only knowledge for bounds, seek back, and eventually
4516	// the binary search finds it. or we can try to be smart and
4517	// not waste time trying to locate more pages. we try to be
4518	// smart, since this data is already in memory anyway, so
4519	// doing needless I/O would be crazy!
4520	static int vorbis_analyze_page(stb_vorbis f, ProbedPage z)
4521	{
4522	uint8 header[27], lacing[255];
4523	uint8 packet_type[255];
4524	int num_packet, packet_start, previous =0;
4525	(void)previous;
4526	int i,len;
4527	uint32 samples;
4528
4529	// record where the page starts
4530	z->page_start = stb_vorbis_get_file_offset(f);
4531
4532	// parse the header
4533	getn(f, header, 27);
4534	assert(header[0] == 'O' && header[1] == 'g' && header[2] == 'g' && header[3] == 'S')((header[0] == 'O' && header[1] == 'g' && header [2] == 'g' && header[3] == 'S') ? (void)0 : _assert("header[0] == 'O' && header[1] == 'g' && header[2] == 'g' && header[3] == 'S'" , "src/siege/internal/stb/stb_vorbis.c", 4534));
4535	getn(f, lacing, header[26]);
4536
4537	// determine the length of the payload
4538	len = 0;
4539	for (i=0; i < header[26]; ++i)
4540	len += lacing[i];
4541
4542	// this implies where the page ends
4543	z->page_end = z->page_start + 27 + header[26] + len;
4544
4545	// read the last-decoded sample out of the data
4546	z->last_decoded_sample = header[6] + (header[7] << 8) + (header[8] << 16) + (header[9] << 16);
4547
4548	if (header[5] & 4) {
4549	// if this is the last page, it's not possible to work
4550	// backwards to figure out the first sample! whoops! fuck.
4551	z->first_decoded_sample = SAMPLE_unknown0xffffffff;
4552	set_file_offset(f, z->page_start);
4553	return 1;
4554	}
4555
4556	// scan through the frames to determine the sample-count of each one...
4557	// our goal is the sample # of the first fully-decoded sample on the
4558	// page, which is the first decoded sample of the 2nd page
4559
4560	num_packet=0;
4561
4562	packet_start = ((header[5] & 1) == 0);
4563
4564	for (i=0; i < header[26]; ++i) {
4565	if (packet_start) {
4566	uint8 n,b,m;
4567	if (lacing[i] == 0) goto bail; // trying to read from zero-length packet
4568	n = get8(f);
4569	// if bottom bit is non-zero, we've got corruption
4570	if (n & 1) goto bail;
4571	n >>= 1;
4572	b = ilog(f->mode_count-1);
4573	m = n >> b;
4574	n &= (1 << b)-1;
4575	if (n >= f->mode_count) goto bail;
4576	if (num_packet == 0 && f->mode_config[n].blockflag)
4577	previous = (m & 1);
4578	packet_type[num_packet++] = f->mode_config[n].blockflag;
4579	skip(f, lacing[i]-1);
4580	} else
4581	skip(f, lacing[i]);
4582	packet_start = (lacing[i] < 255);
4583	}
4584
4585	// now that we know the sizes of all the pages, we can start determining
4586	// how much sample data there is.
4587
4588	samples = 0;
4589
4590	// for the last packet, we step by its whole length, because the definition
4591	// is that we encoded the end sample loc of the 'last packet completed',
4592	// where 'completed' refers to packets being split, and we are left to guess
4593	// what 'end sample loc' means. we assume it means ignoring the fact that
4594	// the last half of the data is useless without windowing against the next
4595	// packet... (so it's not REALLY complete in that sense)
4596	if (num_packet > 1)
4597	samples += f->blocksize[packet_type[num_packet-1]];
4598
4599	for (i=num_packet-2; i >= 1; --i) {
4600	// now, for this packet, how many samples do we have that
4601	// do not overlap the following packet?
4602	if (packet_type[i] == 1)
4603	if (packet_type[i+1] == 1)
4604	samples += f->blocksize_1 >> 1;
4605	else
4606	samples += ((f->blocksize_1 - f->blocksize_0) >> 2) + (f->blocksize_0 >> 1);
4607	else
4608	samples += f->blocksize_0 >> 1;
4609	}
4610	// now, at this point, we've rewound to the very beginning of the
4611	// _second_ packet. if we entirely discard the first packet after
4612	// a seek, this will be exactly the right sample number. HOWEVER!
4613	// we can't as easily compute this number for the LAST page. The
4614	// only way to get the sample offset of the LAST page is to use
4615	// the end loc from the previous page. But what that returns us
4616	// is _exactly_ the place where we get our first non-overlapped
4617	// sample. (I think. Stupid spec for being ambiguous.) So for
4618	// consistency it's better to do that here, too. However, that
4619	// will then require us to NOT discard all of the first frame we
4620	// decode, in some cases, which means an even weirder frame size
4621	// and extra code. what a fucking pain.
4622
4623	// we're going to discard the first packet if we
4624	// start the seek here, so we don't care about it. (we could actually
4625	// do better; if the first packet is long, and the previous packet
4626	// is short, there's actually data in the first half of the first
4627	// packet that doesn't need discarding... but not worth paying the
4628	// effort of tracking that of that here and in the seeking logic)
4629	// except crap, if we infer it from the _previous_ packet's end
4630	// location, we DO need to use that definition... and we HAVE to
4631	// infer the start loc of the LAST packet from the previous packet's
4632	// end location. fuck you, ogg vorbis.
4633
4634	z->first_decoded_sample = z->last_decoded_sample - samples;
4635
4636	// restore file state to where we were
4637	set_file_offset(f, z->page_start);
4638	return 1;
4639
4640	// restore file state to where we were
4641	bail:
4642	set_file_offset(f, z->page_start);
4643	return 0;
4644	}
4645
4646	static int vorbis_seek_frame_from_page(stb_vorbis *f, uint32 page_start, uint32 first_sample, uint32 target_sample, int fine)
4647	{
4648	int left_start, left_end, right_start, right_end, mode,i;
4649	int frame=0;
4650	uint32 frame_start;
4651	int frames_to_skip, data_to_skip;
4652
4653	// first_sample is the sample # of the first sample that doesn't
4654	// overlap the previous page... note that this requires us to
4655	// _partially_ discard the first packet! bleh.
4656	set_file_offset(f, page_start);
4657
4658	f->next_seg = -1; // force page resync
4659
4660	frame_start = first_sample;
4661	// frame start is where the previous packet's last decoded sample
4662	// was, which corresponds to left_end... EXCEPT if the previous
4663	// packet was long and this packet is short? Probably a bug here.
4664
4665
4666	// now, we can start decoding frames... we'll only FAKE decode them,
4667	// until we find the frame that contains our sample; then we'll rewind,
4668	// and try again
4669	for (;;) {
4670	int start;
4671
4672	if (!vorbis_decode_initial(f, &left_start, &left_end, &right_start, &right_end, &mode))
4673	return error(f, VORBIS_seek_failed);
4674
4675	if (frame == 0)
4676	start = left_end;
4677	else
4678	start = left_start;
4679
4680	// the window starts at left_start; the last valid sample we generate
4681	// before the next frame's window start is right_start-1
4682	if (target_sample < frame_start + right_start-start)
4683	break;
4684
4685	flush_packet(f);
4686	if (f->eof)
4687	return error(f, VORBIS_seek_failed);
4688
4689	frame_start += right_start - start;
4690
4691	++frame;
4692	}
4693
4694	// ok, at this point, the sample we want is contained in frame #'frame'
4695
4696	// to decode frame #'frame' normally, we have to decode the
4697	// previous frame first... but if it's the FIRST frame of the page
4698	// we can't. if it's the first frame, it means it falls in the part
4699	// of the first frame that doesn't overlap either of the other frames.
4700	// so, if we have to handle that case for the first frame, we might
4701	// as well handle it for all of them, so:
4702	if (target_sample > frame_start + (left_end - left_start)) {
4703	// so what we want to do is go ahead and just immediately decode
4704	// this frame, but then make it so the next get_frame_float() uses
4705	// this already-decoded data? or do we want to go ahead and rewind,
4706	// and leave a flag saying to skip the first N data? let's do that
4707	frames_to_skip = frame; // if this is frame #1, skip 1 frame (#0)
4708	data_to_skip = left_end - left_start;
4709	} else {
4710	// otherwise, we want to skip frames 0, 1, 2, ... frame-2
4711	// (which means frame-2+1 total frames) then decode frame-1,
4712	// then leave frame pending
4713	frames_to_skip = frame - 1;
4714	assert(frames_to_skip >= 0)((frames_to_skip >= 0) ? (void)0 : _assert("frames_to_skip >= 0" , "src/siege/internal/stb/stb_vorbis.c", 4714));
4715	data_to_skip = -1;
4716	}
4717
4718	set_file_offset(f, page_start);
4719	f->next_seg = - 1; // force page resync
4720
4721	for (i=0; i < frames_to_skip; ++i) {
4722	maybe_start_packet(f);
4723	flush_packet(f);
4724	}
4725
4726	if (data_to_skip >= 0) {
4727	int i,j,n = f->blocksize_0 >> 1;
4728	f->discard_samples_deferred = data_to_skip;
4729	for (i=0; i < f->channels; ++i)
4730	for (j=0; j < n; ++j)
4731	f->previous_window[i][j] = 0;
4732	f->previous_length = n;
4733	frame_start += data_to_skip;
4734	} else {
4735	f->previous_length = 0;
4736	vorbis_pump_first_frame(f);
4737	}
4738
4739	// at this point, the NEXT decoded frame will generate the desired sample
4740	if (fine) {
4741	// so if we're doing sample accurate streaming, we want to go ahead and decode it!
4742	if (target_sample != frame_start) {
4743	int n;
4744	stb_vorbis_get_frame_float(f, &n, NULL((void*)0));
4745	assert(target_sample > frame_start)((target_sample > frame_start) ? (void)0 : _assert("target_sample > frame_start" , "src/siege/internal/stb/stb_vorbis.c", 4745));
4746	assert(f->channel_buffer_start + (int) (target_sample-frame_start) < f->channel_buffer_end)((f->channel_buffer_start + (int) (target_sample-frame_start ) < f->channel_buffer_end) ? (void)0 : _assert("f->channel_buffer_start + (int) (target_sample-frame_start) < f->channel_buffer_end" , "src/siege/internal/stb/stb_vorbis.c", 4746));
4747	f->channel_buffer_start += (target_sample - frame_start);
4748	}
4749	}
4750
4751	return 0;
4752	}
4753
4754	static int vorbis_seek_base(stb_vorbis *f, unsigned int sample_number, int fine)
4755	{
4756	ProbedPage p[2],q;
4757	if (IS_PUSH_MODE(f)((f)->push_mode)) return error(f, VORBIS_invalid_api_mixing);
4758
4759	// do we know the location of the last page?
4760	if (f->p_last.page_start == 0) {
4761	uint32 z = stb_vorbis_stream_length_in_samples(f);
4762	if (z == 0) return error(f, VORBIS_cant_find_last_page);
4763	}
4764
4765	p[0] = f->p_first;
4766	p[1] = f->p_last;
4767
4768	if (sample_number >= f->p_last.last_decoded_sample)
4769	sample_number = f->p_last.last_decoded_sample-1;
4770
4771	if (sample_number < f->p_first.last_decoded_sample) {
4772	vorbis_seek_frame_from_page(f, p[0].page_start, 0, sample_number, fine);
4773	return 0;
4774	} else {
4775	int attempts=0;
4776	while (p[0].page_end < p[1].page_start) {
4777	uint32 probe;
4778	uint32 start_offset, end_offset;
4779	uint32 start_sample, end_sample;
4780
4781	// copy these into local variables so we can tweak them
4782	// if any are unknown
4783	start_offset = p[0].page_end;
4784	end_offset = p[1].after_previous_page_start; // an address known to seek to page p[1]
4785	start_sample = p[0].last_decoded_sample;
4786	end_sample = p[1].last_decoded_sample;
4787
4788	// currently there is no such tweaking logic needed/possible?
4789	if (start_sample == SAMPLE_unknown0xffffffff \|\| end_sample == SAMPLE_unknown0xffffffff)
4790	return error(f, VORBIS_seek_failed);
4791
4792	// now we want to lerp between these for the target samples...
4793
4794	// step 1: we need to bias towards the page start...
4795	if (start_offset + 4000 < end_offset)
4796	end_offset -= 4000;
4797
4798	// now compute an interpolated search loc
4799	probe = start_offset + (int) floor((float) (end_offset - start_offset) / (end_sample - start_sample) * (sample_number - start_sample));
4800
4801	// next we need to bias towards binary search...
4802	// code is a little wonky to allow for full 32-bit unsigned values
4803	if (attempts >= 4) {
4804	uint32 probe2 = start_offset + ((end_offset - start_offset) >> 1);
4805	if (attempts >= 8)
4806	probe = probe2;
4807	else if (probe < probe2)
4808	probe = probe + ((probe2 - probe) >> 1);
4809	else
4810	probe = probe2 + ((probe - probe2) >> 1);
4811	}
4812	++attempts;
4813
4814	set_file_offset(f, probe);
4815	if (!vorbis_find_page(f, NULL((void)0), NULL((void)0))) return error(f, VORBIS_seek_failed);
4816	if (!vorbis_analyze_page(f, &q)) return error(f, VORBIS_seek_failed);
4817	q.after_previous_page_start = probe;
4818
4819	// it's possible we've just found the last page again
4820	if (q.page_start == p[1].page_start) {
4821	p[1] = q;
4822	continue;
4823	}
4824
4825	if (sample_number < q.last_decoded_sample)
4826	p[1] = q;
4827	else
4828	p[0] = q;
4829	}
4830
4831	if (p[0].last_decoded_sample <= sample_number && sample_number < p[1].last_decoded_sample) {
4832	vorbis_seek_frame_from_page(f, p[1].page_start, p[0].last_decoded_sample, sample_number, fine);
4833	return 0;
4834	}
4835	return error(f, VORBIS_seek_failed);
4836	}
4837	}
4838
4839	int stb_vorbis_seek_frame(stb_vorbis *f, unsigned int sample_number)
4840	{
4841	return vorbis_seek_base(f, sample_number, FALSE0);
4842	}
4843
4844	int stb_vorbis_seek(stb_vorbis *f, unsigned int sample_number)
4845	{
4846	return vorbis_seek_base(f, sample_number, TRUE1);
4847	}
4848
4849	void stb_vorbis_seek_start(stb_vorbis *f)
4850	{
4851	if (IS_PUSH_MODE(f)((f)->push_mode)) { error(f, VORBIS_invalid_api_mixing); return; }
4852	set_file_offset(f, f->first_audio_page_offset);
4853	f->previous_length = 0;
4854	f->first_decode = TRUE1;
4855	f->next_seg = -1;
4856	vorbis_pump_first_frame(f);
4857	}
4858
4859	unsigned int stb_vorbis_stream_length_in_samples(stb_vorbis *f)
4860	{
4861	unsigned int restore_offset, previous_safe;
4862	unsigned int end, last_page_loc;
4863
4864	if (IS_PUSH_MODE(f)((f)->push_mode)) return error(f, VORBIS_invalid_api_mixing);
4865	if (!f->total_samples) {
4866	int last;
4867	uint32 lo,hi;
4868	char header[6];
4869
4870	// first, store the current decode position so we can restore it
4871	restore_offset = stb_vorbis_get_file_offset(f);
4872
4873	// now we want to seek back 64K from the end (the last page must
4874	// be at most a little less than 64K, but let's allow a little slop)
4875	if (f->stream_len >= 65536 && f->stream_len-65536 >= f->first_audio_page_offset)
4876	previous_safe = f->stream_len - 65536;
4877	else
4878	previous_safe = f->first_audio_page_offset;
4879
4880	set_file_offset(f, previous_safe);
4881	// previous_safe is now our candidate 'earliest known place that seeking
4882	// to will lead to the final page'
4883
4884	if (!vorbis_find_page(f, &end, (int unsigned *)&last)) {
4885	// if we can't find a page, we're hosed!
4886	f->error = VORBIS_cant_find_last_page;
4887	f->total_samples = 0xffffffff;
4888	goto done;
4889	}
4890
4891	// check if there are more pages
4892	last_page_loc = stb_vorbis_get_file_offset(f);
4893
4894	// stop when the last_page flag is set, not when we reach eof;
4895	// this allows us to stop short of a 'file_section' end without
4896	// explicitly checking the length of the section
4897	while (!last) {
4898	set_file_offset(f, end);
4899	if (!vorbis_find_page(f, &end, (int unsigned *)&last)) {
4900	// the last page we found didn't have the 'last page' flag
4901	// set. whoops!
4902	break;
4903	}
4904	previous_safe = last_page_loc+1;
4905	last_page_loc = stb_vorbis_get_file_offset(f);
4906	}
4907
4908	set_file_offset(f, last_page_loc);
4909
4910	// parse the header
4911	getn(f, (unsigned char *)header, 6);
4912	// extract the absolute granule position
4913	lo = get32(f);
4914	hi = get32(f);
4915	if (lo == 0xffffffff && hi == 0xffffffff) {
4916	f->error = VORBIS_cant_find_last_page;
4917	f->total_samples = SAMPLE_unknown0xffffffff;
4918	goto done;
4919	}
4920	if (hi)
4921	lo = 0xfffffffe; // saturate
4922	f->total_samples = lo;
4923
4924	f->p_last.page_start = last_page_loc;
4925	f->p_last.page_end = end;
4926	f->p_last.last_decoded_sample = lo;
4927	f->p_last.first_decoded_sample = SAMPLE_unknown0xffffffff;
4928	f->p_last.after_previous_page_start = previous_safe;
4929
4930	done:
4931	set_file_offset(f, restore_offset);
4932	}
4933	return f->total_samples == SAMPLE_unknown0xffffffff ? 0 : f->total_samples;
4934	}
4935
4936	float stb_vorbis_stream_length_in_seconds(stb_vorbis *f)
4937	{
4938	return stb_vorbis_stream_length_in_samples(f) / (float) f->sample_rate;
4939	}
4940
4941
4942
4943	int stb_vorbis_get_frame_float(stb_vorbis f, int channels, float ***output)
4944	{
4945	int len, right,left,i;
4946	if (IS_PUSH_MODE(f)((f)->push_mode)) return error(f, VORBIS_invalid_api_mixing);
4947
4948	if (!vorbis_decode_packet(f, &len, &left, &right)) {
4949	f->channel_buffer_start = f->channel_buffer_end = 0;
4950	return 0;
4951	}
4952
4953	len = vorbis_finish_frame(f, len, left, right);
4954	for (i=0; i < f->channels; ++i)
4955	f->outputs[i] = f->channel_buffers[i] + left;
4956
4957	f->channel_buffer_start = left;
4958	f->channel_buffer_end = left+len;
4959
4960	if (channels) *channels = f->channels;
4961	if (output) *output = f->outputs;
4962	return len;
4963	}
4964
4965	#ifndef STB_VORBIS_NO_STDIO
4966
4967	stb_vorbis * stb_vorbis_open_file_section(FILE file, int close_on_free, int error, stb_vorbis_alloc *alloc, unsigned int length)
4968	{
4969	stb_vorbis *f, p;
4970	vorbis_init(&p, alloc);
4971	p.f = file;
4972	p.f_start = ftell(file);
4973	p.stream_len = length;
4974	p.close_on_free = close_on_free;
4975	if (start_decoder(&p)) {
4976	f = vorbis_alloc(&p);
4977	if (f) {
4978	*f = p;
4979	vorbis_pump_first_frame(f);
4980	return f;
4981	}
4982	}
4983	if (error) *error = p.error;
4984	vorbis_deinit(&p);
4985	return NULL((void*)0);
4986	}
4987
4988	stb_vorbis * stb_vorbis_open_file(FILE file, int close_on_free, int error, stb_vorbis_alloc *alloc)
4989	{
4990	unsigned int len, start;
4991	start = ftell(file);
4992	fseek(file, 0, SEEK_END2);
4993	len = ftell(file) - start;
4994	fseek(file, start, SEEK_SET0);
4995	return stb_vorbis_open_file_section(file, close_on_free, error, alloc, len);
4996	}
4997
4998	stb_vorbis * stb_vorbis_open_filename(char filename, int error, stb_vorbis_alloc *alloc)
4999	{
5000	FILE *f = fopen(filename, "rb");
5001	if (f)
5002	return stb_vorbis_open_file(f, TRUE1, error, alloc);
5003	if (error) *error = VORBIS_file_open_failure;
5004	return NULL((void*)0);
5005	}
5006	#endif // STB_VORBIS_NO_STDIO
5007
5008	stb_vorbis * stb_vorbis_open_memory(unsigned char data, int len, int error, stb_vorbis_alloc *alloc)
5009	{
5010	stb_vorbis *f, p;
5011	if (data == NULL((void)0)) return NULL((void)0);
5012	vorbis_init(&p, alloc);
5013	p.stream = data;
5014	p.stream_end = data + len;
5015	p.stream_start = p.stream;
5016	p.stream_len = len;
5017	p.push_mode = FALSE0;
5018	if (start_decoder(&p)) {
5019	f = vorbis_alloc(&p);
5020	if (f) {
5021	*f = p;
5022	vorbis_pump_first_frame(f);
5023	return f;
5024	}
5025	}
5026	if (error) *error = p.error;
5027	vorbis_deinit(&p);
5028	return NULL((void*)0);
5029	}
5030
5031	#ifndef STB_VORBIS_NO_INTEGER_CONVERSION
5032	#define PLAYBACK_MONO1 1
5033	#define PLAYBACK_LEFT2 2
5034	#define PLAYBACK_RIGHT4 4
5035
5036	#define L(2 \| 1) (PLAYBACK_LEFT2 \| PLAYBACK_MONO1)
5037	#define C(2 \| 4 \| 1) (PLAYBACK_LEFT2 \| PLAYBACK_RIGHT4 \| PLAYBACK_MONO1)
5038	#define R(4 \| 1) (PLAYBACK_RIGHT4 \| PLAYBACK_MONO1)
5039
5040	static int8 channel_position[7][6] =
5041	{
5042	{ 0 },
5043	{ C(2 \| 4 \| 1) },
5044	{ L(2 \| 1), R(4 \| 1) },
5045	{ L(2 \| 1), C(2 \| 4 \| 1), R(4 \| 1) },
5046	{ L(2 \| 1), R(4 \| 1), L(2 \| 1), R(4 \| 1) },
5047	{ L(2 \| 1), C(2 \| 4 \| 1), R(4 \| 1), L(2 \| 1), R(4 \| 1) },
5048	{ L(2 \| 1), C(2 \| 4 \| 1), R(4 \| 1), L(2 \| 1), R(4 \| 1), C(2 \| 4 \| 1) },
5049	};
5050
5051
#ifndef STB_VORBIS_NO_FAST_SCALED_FLOAT
   // float/int overlay used to read the bit pattern of a float
   typedef union {
      float f;
      int i;
   } float_conv;
   // fails to compile (array of size 0) unless float and int are both 4 bytes
   typedef char stb_vorbis_float_size_test[sizeof(float)==4 && sizeof(int) == 4];
   // declares the scratch union needed by FAST_SCALED_FLOAT_TO_INT
   #define FASTDEF(x) float_conv x
   // add (1<<23) to convert to int, then divide by 2^SHIFT, then add 0.5/2^SHIFT to round
   #define MAGIC(SHIFT) (1.5f * (1 << (23-SHIFT)) + 0.5f/(1 << SHIFT))
   #define ADDEND(SHIFT) (((150-SHIFT) << 23) + (1 << 22))
   // evaluates to (x) scaled by 2^s as an int, using 'temp' as scratch
   #define FAST_SCALED_FLOAT_TO_INT(temp,x,s) (temp.f = (x) + MAGIC(s), temp.i - ADDEND(s))
   #define check_endianness()
#else
   // portable fallback: plain multiply and truncate; no scratch variable
   #define FAST_SCALED_FLOAT_TO_INT(temp,x,s) ((int) ((x) * (1 << (s))))
   #define check_endianness()
   #define FASTDEF(x)
#endif
5069
5070	static void copy_samples(short dest, float src, int len)
5071	{
5072	int i;
5073	check_endianness();
5074	for (i=0; i < len; ++i) {
5075	FASTDEF(temp)float_conv temp;
5076	int v = FAST_SCALED_FLOAT_TO_INT(temp, src[i],15)(temp.f = (src[i]) + (1.5f * (1 << (23-15)) + 0.5f/(1 << 15)), temp.i - (((150-15) << 23) + (1 << 22)));
5077	if ((unsigned int) (v + 32768) > 65535)
5078	v = v < 0 ? -32768 : 32767;
5079	dest[i] = v;
5080	}
5081	}
5082
5083	static void compute_samples(int mask, short output, int num_c, float *data, int d_offset, int len)
5084	{
5085	#define BUFFER_SIZE32 32
5086	float buffer[BUFFER_SIZE32];
5087	int i,j,o,n = BUFFER_SIZE32;
5088	check_endianness();
5089	for (o = 0; o < len; o += BUFFER_SIZE32) {
5090	memset(buffer, 0, sizeof(buffer));
5091	if (o + n > len) n = len - o;
5092	for (j=0; j < num_c; ++j) {
5093	if (channel_position[num_c][j] & mask) {
5094	for (i=0; i < n; ++i)
5095	buffer[i] += data[j][d_offset+o+i];
5096	}
5097	}
5098	for (i=0; i < n; ++i) {
5099	FASTDEF(temp)float_conv temp;
5100	int v = FAST_SCALED_FLOAT_TO_INT(temp,buffer[i],15)(temp.f = (buffer[i]) + (1.5f * (1 << (23-15)) + 0.5f/( 1 << 15)), temp.i - (((150-15) << 23) + (1 << 22)));
5101	if ((unsigned int) (v + 32768) > 65535)
5102	v = v < 0 ? -32768 : 32767;
5103	output[o+i] = v;
5104	}
5105	}
5106	}
5107
5108	static int channel_selector[3][2] = { {0}, {PLAYBACK_MONO1}, {PLAYBACK_LEFT2, PLAYBACK_RIGHT4} };
5109	static void compute_stereo_samples(short output, int num_c, float *data, int d_offset, int len)
5110	{
5111	#define BUFFER_SIZE32 32
5112	float buffer[BUFFER_SIZE32];
5113	int i,j,o,n = BUFFER_SIZE32 >> 1;
5114	// o is the offset in the source data
5115	check_endianness();
5116	for (o = 0; o < len; o += BUFFER_SIZE32 >> 1) {
5117	// o2 is the offset in the output data
5118	int o2 = o << 1;
5119	memset(buffer, 0, sizeof(buffer));
5120	if (o + n > len) n = len - o;
5121	for (j=0; j < num_c; ++j) {
5122	int m = channel_position[num_c][j] & (PLAYBACK_LEFT2 \| PLAYBACK_RIGHT4);
5123	if (m == (PLAYBACK_LEFT2 \| PLAYBACK_RIGHT4)) {
5124	for (i=0; i < n; ++i) {
5125	buffer[i*2+0] += data[j][d_offset+o+i];
5126	buffer[i*2+1] += data[j][d_offset+o+i];
5127	}
5128	} else if (m == PLAYBACK_LEFT2) {
5129	for (i=0; i < n; ++i) {
5130	buffer[i*2+0] += data[j][d_offset+o+i];
5131	}
5132	} else if (m == PLAYBACK_RIGHT4) {
5133	for (i=0; i < n; ++i) {
5134	buffer[i*2+1] += data[j][d_offset+o+i];
5135	}
5136	}
5137	}
5138	for (i=0; i < (n<<1); ++i) {
5139	FASTDEF(temp)float_conv temp;
5140	int v = FAST_SCALED_FLOAT_TO_INT(temp,buffer[i],15)(temp.f = (buffer[i]) + (1.5f * (1 << (23-15)) + 0.5f/( 1 << 15)), temp.i - (((150-15) << 23) + (1 << 22)));
5141	if ((unsigned int) (v + 32768) > 65535)
5142	v = v < 0 ? -32768 : 32767;
5143	output[o2+i] = v;
5144	}
5145	}
5146	}
5147
5148	static void convert_samples_short(int buf_c, short buffer, int b_offset, int data_c, float data, int d_offset, int samples)
5149	{
5150	int i;
5151	if (buf_c != data_c && buf_c <= 2 && data_c <= 6) {
5152	static int channel_selector[3][2] = { {0}, {PLAYBACK_MONO1}, {PLAYBACK_LEFT2, PLAYBACK_RIGHT4} };
5153	for (i=0; i < buf_c; ++i)
5154	compute_samples(channel_selector[buf_c][i], buffer[i]+b_offset, data_c, data, d_offset, samples);
5155	} else {
5156	int limit = buf_c < data_c ? buf_c : data_c;
5157	for (i=0; i < limit; ++i)
5158	copy_samples(buffer[i]+b_offset, data[i], samples);
5159	for ( ; i < buf_c; ++i)
5160	memset(buffer[i]+b_offset, 0, sizeof(short) * samples);
5161	}
5162	}
5163
5164	int stb_vorbis_get_frame_short(stb_vorbis f, int num_c, short *buffer, int num_samples)
5165	{
5166	float **output;
5167	int len = stb_vorbis_get_frame_float(f, NULL((void*)0), &output);
5168	if (len > num_samples) len = num_samples;
5169	if (len)
5170	convert_samples_short(num_c, buffer, 0, f->channels, output, 0, len);
5171	return len;
5172	}
5173
5174	static void convert_channels_short_interleaved(int buf_c, short buffer, int data_c, float *data, int d_offset, int len)
5175	{
5176	int i;
5177	check_endianness();
5178	if (buf_c != data_c && buf_c <= 2 && data_c <= 6) {
5179	assert(buf_c == 2)((buf_c == 2) ? (void)0 : _assert("buf_c == 2", "src/siege/internal/stb/stb_vorbis.c" , 5179));
5180	for (i=0; i < buf_c; ++i)
5181	compute_stereo_samples(buffer, data_c, data, d_offset, len);
5182	} else {
5183	int limit = buf_c < data_c ? buf_c : data_c;
5184	int j;
5185	for (j=0; j < len; ++j) {
5186	for (i=0; i < limit; ++i) {
5187	FASTDEF(temp)float_conv temp;
5188	float f = data[i][d_offset+j];
5189	int v = FAST_SCALED_FLOAT_TO_INT(temp, f,15)(temp.f = (f) + (1.5f * (1 << (23-15)) + 0.5f/(1 << 15)), temp.i - (((150-15) << 23) + (1 << 22)));//data[i][d_offset+j],15);
5190	if ((unsigned int) (v + 32768) > 65535)
5191	v = v < 0 ? -32768 : 32767;
5192	*buffer++ = v;
5193	}
5194	for ( ; i < buf_c; ++i)
5195	*buffer++ = 0;
5196	}
5197	}
5198	}
5199
5200	int stb_vorbis_get_frame_short_interleaved(stb_vorbis f, int num_c, short buffer, int num_shorts)
5201	{
5202	float **output;
5203	int len;
5204	if (num_c == 1) return stb_vorbis_get_frame_short(f,num_c,&buffer, num_shorts);
5205	len = stb_vorbis_get_frame_float(f, NULL((void*)0), &output);
5206	if (len) {
5207	if (len*num_c > num_shorts) len = num_shorts / num_c;
5208	convert_channels_short_interleaved(num_c, buffer, f->channels, output, 0, len);
5209	}
5210	return len;
5211	}
5212
5213	int stb_vorbis_get_samples_short_interleaved(stb_vorbis f, int channels, short buffer, int num_shorts)
5214	{
5215	float **outputs;
5216	int len = num_shorts / channels;
5217	int n=0;
5218	int z = f->channels;
5219	if (z > channels) z = channels;
5220	while (n < len) {
5221	int k = f->channel_buffer_end - f->channel_buffer_start;
5222	if (n+k >= len) k = len - n;
5223	if (k)
5224	convert_channels_short_interleaved(channels, buffer, f->channels, f->channel_buffers, f->channel_buffer_start, k);
5225	buffer += k*channels;
5226	n += k;
5227	f->channel_buffer_start += k;
5228	if (n == len) break;
5229	if (!stb_vorbis_get_frame_float(f, NULL((void*)0), &outputs)) break;
5230	}
5231	return n;
5232	}
5233
5234	int stb_vorbis_get_samples_short(stb_vorbis f, int channels, short *buffer, int len)
5235	{
5236	float **outputs;
5237	int n=0;
5238	int z = f->channels;
5239	if (z > channels) z = channels;
	Value stored to 'z' is never read
5240	while (n < len) {
5241	int k = f->channel_buffer_end - f->channel_buffer_start;
5242	if (n+k >= len) k = len - n;
5243	if (k)
5244	convert_samples_short(channels, buffer, n, f->channels, f->channel_buffers, f->channel_buffer_start, k);
5245	n += k;
5246	f->channel_buffer_start += k;
5247	if (n == len) break;
5248	if (!stb_vorbis_get_frame_float(f, NULL((void*)0), &outputs)) break;
5249	}
5250	return n;
5251	}
5252
5253	#ifndef STB_VORBIS_NO_STDIO
5254	int stb_vorbis_decode_filename(char filename, int channels, short **output)
5255	{
5256	int data_len, offset, total, limit, error;
5257	short *data;
5258	stb_vorbis v = stb_vorbis_open_filename(filename, &error, NULL((void)0));
5259	if (v == NULL((void*)0)) return -1;
5260	limit = v->channels * 4096;
5261	*channels = v->channels;
5262	offset = data_len = 0;
5263	total = limit;
5264	data = (short ) malloc(total sizeof(*data));
5265	if (data == NULL((void*)0)) {
5266	stb_vorbis_close(v);
5267	return -2;
5268	}
5269	for (;;) {
5270	int n = stb_vorbis_get_frame_short_interleaved(v, v->channels, data+offset, total-offset);
5271	if (n == 0) break;
5272	data_len += n;
5273	offset += n * v->channels;
5274	if (offset + limit > total) {
5275	short *data2;
5276	total *= 2;
5277	data2 = (short ) realloc(data, total sizeof(*data));
5278	if (data2 == NULL((void*)0)) {
5279	free(data);
5280	stb_vorbis_close(v);
5281	return -2;
5282	}
5283	data = data2;
5284	}
5285	}
5286	*output = data;
5287	return data_len;
5288	}
5289	#endif // NO_STDIO
5290
5291	int stb_vorbis_decode_memory(uint8 mem, int len, int channels, short **output)
5292	{
5293	int data_len, offset, total, limit, error;
5294	short *data;
5295	stb_vorbis v = stb_vorbis_open_memory(mem, len, &error, NULL((void)0));
5296	if (v == NULL((void*)0)) return -1;
5297	limit = v->channels * 4096;
5298	*channels = v->channels;
5299	offset = data_len = 0;
5300	total = limit;
5301	data = (short ) malloc(total sizeof(*data));
5302	if (data == NULL((void*)0)) {
5303	stb_vorbis_close(v);
5304	return -2;
5305	}
5306	for (;;) {
5307	int n = stb_vorbis_get_frame_short_interleaved(v, v->channels, data+offset, total-offset);
5308	if (n == 0) break;
5309	data_len += n;
5310	offset += n * v->channels;
5311	if (offset + limit > total) {
5312	short *data2;
5313	total *= 2;
5314	data2 = (short ) realloc(data, total sizeof(*data));
5315	if (data2 == NULL((void*)0)) {
5316	free(data);
5317	stb_vorbis_close(v);
5318	return -2;
5319	}
5320	data = data2;
5321	}
5322	}
5323	*output = data;
5324	return data_len;
5325	}
5326	#endif
5327
5328	int stb_vorbis_get_samples_float_interleaved(stb_vorbis f, int channels, float buffer, int num_floats)
5329	{
5330	float **outputs;
5331	int len = num_floats / channels;
5332	int n=0;
5333	int z = f->channels;
5334	if (z > channels) z = channels;
5335	while (n < len) {
5336	int i,j;
5337	int k = f->channel_buffer_end - f->channel_buffer_start;
5338	if (n+k >= len) k = len - n;
5339	for (j=0; j < k; ++j) {
5340	for (i=0; i < z; ++i)
5341	*buffer++ = f->channel_buffers[i][f->channel_buffer_start+j];
5342	for ( ; i < channels; ++i)
5343	*buffer++ = 0;
5344	}
5345	n += k;
5346	f->channel_buffer_start += k;
5347	if (n == len) break;
5348	if (!stb_vorbis_get_frame_float(f, NULL((void*)0), &outputs)) break;
5349	}
5350	return n;
5351	}
5352
5353	int stb_vorbis_get_samples_float(stb_vorbis f, int channels, float *buffer, int num_samples)
5354	{
5355	float **outputs;
5356	int n=0;
5357	int z = f->channels;
5358	if (z > channels) z = channels;
5359	while (n < num_samples) {
5360	int i;
5361	int k = f->channel_buffer_end - f->channel_buffer_start;
5362	if (n+k >= num_samples) k = num_samples - n;
5363	if (k) {
5364	for (i=0; i < z; ++i)
5365	memcpy(buffer[i]+n, f->channel_buffers+f->channel_buffer_start, sizeof(float)*k);
5366	for ( ; i < channels; ++i)
5367	memset(buffer[i]+n, 0, sizeof(float) * k);
5368	}
5369	n += k;
5370	f->channel_buffer_start += k;
5371	if (n == num_samples) break;
5372	if (!stb_vorbis_get_frame_float(f, NULL((void*)0), &outputs)) break;
5373	}
5374	return n;
5375	}
5376	#endif // STB_VORBIS_NO_PULLDATA_API
5377
5378	void _dummyFunction(void)
5379	{
5380	(void)get_bits_signed;
5381	(void)codebook_decode_scalar;
5382	(void)channel_selector;
5383	}
5384
5385	#endif // STB_VORBIS_HEADER_ONLY