File: | c:\siege\siege/src/siege/internal/stb/stb_vorbis.c |
Location: | line 4540, column 11 |
Description: | Assigned value is garbage or undefined |
1 | // Ogg Vorbis I audio decoder -- version 0.99996 | |||
2 | // | |||
3 | // Written in April 2007 by Sean Barrett, sponsored by RAD Game Tools. | |||
4 | // | |||
5 | // Placed in the public domain April 2007 by the author: no copyright is | |||
6 | // claimed, and you may use it for any purpose you like. | |||
7 | // | |||
8 | // No warranty for any purpose is expressed or implied by the author (nor | |||
9 | // by RAD Game Tools). Report bugs and send enhancements to the author. | |||
10 | // | |||
11 | // Get the latest version and other information at: | |||
12 | // http://nothings.org/stb_vorbis/ | |||
13 | ||||
14 | ||||
15 | // Todo: | |||
16 | // | |||
17 | // - seeking (note you can seek yourself using the pushdata API) | |||
18 | // | |||
19 | // Limitations: | |||
20 | // | |||
21 | // - floor 0 not supported (used in old ogg vorbis files) | |||
22 | // - lossless sample-truncation at beginning ignored | |||
23 | // - cannot concatenate multiple vorbis streams | |||
24 | // - sample positions are 32-bit, limiting seekable 192Khz | |||
25 | // files to around 6 hours (Ogg supports 64-bit) | |||
26 | // | |||
27 | // All of these limitations may be removed in future versions. | |||
28 | ||||
29 | ||||
30 | ////////////////////////////////////////////////////////////////////////////// | |||
31 | // | |||
32 | // HEADER BEGINS HERE | |||
33 | // | |||
34 | ||||
35 | #ifndef STB_VORBIS_INCLUDE_STB_VORBIS_H | |||
36 | #define STB_VORBIS_INCLUDE_STB_VORBIS_H | |||
37 | ||||
38 | #if defined(STB_VORBIS_NO_CRT) && !defined(STB_VORBIS_NO_STDIO) | |||
39 | #define STB_VORBIS_NO_STDIO 1 | |||
40 | #endif | |||
41 | ||||
42 | #ifndef STB_VORBIS_NO_STDIO | |||
43 | #include <stdio.h> | |||
44 | #endif | |||
45 | ||||
46 | #ifdef __cplusplus | |||
47 | extern "C" { | |||
48 | #endif | |||
49 | ||||
50 | /////////// THREAD SAFETY | |||
51 | ||||
52 | // Individual stb_vorbis* handles are not thread-safe; you cannot decode from | |||
53 | // them from multiple threads at the same time. However, you can have multiple | |||
54 | // stb_vorbis* handles and decode from them independently in multiple thrads. | |||
55 | ||||
56 | ||||
57 | /////////// MEMORY ALLOCATION | |||
58 | ||||
59 | // normally stb_vorbis uses malloc() to allocate memory at startup, | |||
60 | // and alloca() to allocate temporary memory during a frame on the | |||
61 | // stack. (Memory consumption will depend on the amount of setup | |||
62 | // data in the file and how you set the compile flags for speed | |||
63 | // vs. size. In my test files the maximal-size usage is ~150KB.) | |||
64 | // | |||
65 | // You can modify the wrapper functions in the source (setup_malloc, | |||
66 | // setup_temp_malloc, temp_malloc) to change this behavior, or you | |||
67 | // can use a simpler allocation model: you pass in a buffer from | |||
68 | // which stb_vorbis will allocate _all_ its memory (including the | |||
69 | // temp memory). "open" may fail with a VORBIS_outofmem if you | |||
70 | // do not pass in enough data; there is no way to determine how | |||
71 | // much you do need except to succeed (at which point you can | |||
72 | // query get_info to find the exact amount required. yes I know | |||
73 | // this is lame). | |||
74 | // | |||
75 | // If you pass in a non-NULL buffer of the type below, allocation | |||
76 | // will occur from it as described above. Otherwise just pass NULL | |||
77 | // to use malloc()/alloca() | |||
78 | ||||
79 | typedef struct | |||
80 | { | |||
81 | char *alloc_buffer; | |||
82 | int alloc_buffer_length_in_bytes; | |||
83 | } stb_vorbis_alloc; | |||
84 | ||||
85 | ||||
86 | /////////// FUNCTIONS USEABLE WITH ALL INPUT MODES | |||
87 | ||||
88 | typedef struct stb_vorbis stb_vorbis; | |||
89 | ||||
90 | typedef struct | |||
91 | { | |||
92 | unsigned int sample_rate; | |||
93 | int channels; | |||
94 | ||||
95 | unsigned int setup_memory_required; | |||
96 | unsigned int setup_temp_memory_required; | |||
97 | unsigned int temp_memory_required; | |||
98 | ||||
99 | int max_frame_size; | |||
100 | } stb_vorbis_info; | |||
101 | ||||
102 | // get general information about the file | |||
103 | extern stb_vorbis_info stb_vorbis_get_info(stb_vorbis *f); | |||
104 | ||||
105 | // get the last error detected (clears it, too) | |||
106 | extern int stb_vorbis_get_error(stb_vorbis *f); | |||
107 | ||||
108 | // close an ogg vorbis file and free all memory in use | |||
109 | extern void stb_vorbis_close(stb_vorbis *f); | |||
110 | ||||
111 | // this function returns the offset (in samples) from the beginning of the | |||
112 | // file that will be returned by the next decode, if it is known, or -1 | |||
113 | // otherwise. after a flush_pushdata() call, this may take a while before | |||
114 | // it becomes valid again. | |||
115 | // NOT WORKING YET after a seek with PULLDATA API | |||
116 | extern int stb_vorbis_get_sample_offset(stb_vorbis *f); | |||
117 | ||||
118 | // returns the current seek point within the file, or offset from the beginning | |||
119 | // of the memory buffer. In pushdata mode it returns 0. | |||
120 | extern unsigned int stb_vorbis_get_file_offset(stb_vorbis *f); | |||
121 | ||||
122 | /////////// PUSHDATA API | |||
123 | ||||
124 | #ifndef STB_VORBIS_NO_PUSHDATA_API | |||
125 | ||||
126 | // this API allows you to get blocks of data from any source and hand | |||
127 | // them to stb_vorbis. you have to buffer them; stb_vorbis will tell | |||
128 | // you how much it used, and you have to give it the rest next time; | |||
129 | // and stb_vorbis may not have enough data to work with and you will | |||
130 | // need to give it the same data again PLUS more. Note that the Vorbis | |||
131 | // specification does not bound the size of an individual frame. | |||
132 | ||||
133 | extern stb_vorbis *stb_vorbis_open_pushdata( | |||
134 | unsigned char *datablock, int datablock_length_in_bytes, | |||
135 | int *datablock_memory_consumed_in_bytes, | |||
136 | int *error, | |||
137 | stb_vorbis_alloc *alloc_buffer); | |||
138 | // create a vorbis decoder by passing in the initial data block containing | |||
139 | // the ogg&vorbis headers (you don't need to do parse them, just provide | |||
140 | // the first N bytes of the file--you're told if it's not enough, see below) | |||
141 | // on success, returns an stb_vorbis *, does not set error, returns the amount of | |||
142 | // data parsed/consumed on this call in *datablock_memory_consumed_in_bytes; | |||
143 | // on failure, returns NULL on error and sets *error, does not change *datablock_memory_consumed | |||
144 | // if returns NULL and *error is VORBIS_need_more_data, then the input block was | |||
145 | // incomplete and you need to pass in a larger block from the start of the file | |||
146 | ||||
147 | extern int stb_vorbis_decode_frame_pushdata( | |||
148 | stb_vorbis *f, unsigned char *datablock, int datablock_length_in_bytes, | |||
149 | int *channels, // place to write number of float * buffers | |||
150 | float ***output, // place to write float ** array of float * buffers | |||
151 | int *samples // place to write number of output samples | |||
152 | ); | |||
153 | // decode a frame of audio sample data if possible from the passed-in data block | |||
154 | // | |||
155 | // return value: number of bytes we used from datablock | |||
156 | // possible cases: | |||
157 | // 0 bytes used, 0 samples output (need more data) | |||
158 | // N bytes used, 0 samples output (resynching the stream, keep going) | |||
159 | // N bytes used, M samples output (one frame of data) | |||
160 | // note that after opening a file, you will ALWAYS get one N-bytes,0-sample | |||
161 | // frame, because Vorbis always "discards" the first frame. | |||
162 | // | |||
163 | // Note that on resynch, stb_vorbis will rarely consume all of the buffer, | |||
164 | // instead only datablock_length_in_bytes-3 or less. This is because it wants | |||
165 | // to avoid missing parts of a page header if they cross a datablock boundary, | |||
166 | // without writing state-machiney code to record a partial detection. | |||
167 | // | |||
168 | // The number of channels returned are stored in *channels (which can be | |||
169 | // NULL--it is always the same as the number of channels reported by | |||
170 | // get_info). *output will contain an array of float* buffers, one per | |||
171 | // channel. In other words, (*output)[0][0] contains the first sample from | |||
172 | // the first channel, and (*output)[1][0] contains the first sample from | |||
173 | // the second channel. | |||
174 | ||||
175 | extern void stb_vorbis_flush_pushdata(stb_vorbis *f); | |||
176 | // inform stb_vorbis that your next datablock will not be contiguous with | |||
177 | // previous ones (e.g. you've seeked in the data); future attempts to decode | |||
178 | // frames will cause stb_vorbis to resynchronize (as noted above), and | |||
179 | // once it sees a valid Ogg page (typically 4-8KB, as large as 64KB), it | |||
180 | // will begin decoding the _next_ frame. | |||
181 | // | |||
182 | // if you want to seek using pushdata, you need to seek in your file, then | |||
183 | // call stb_vorbis_flush_pushdata(), then start calling decoding, then once | |||
184 | // decoding is returning you data, call stb_vorbis_get_sample_offset, and | |||
185 | // if you don't like the result, seek your file again and repeat. | |||
186 | #endif | |||
187 | ||||
188 | ||||
189 | ////////// PULLING INPUT API | |||
190 | ||||
191 | #ifndef STB_VORBIS_NO_PULLDATA_API | |||
192 | // This API assumes stb_vorbis is allowed to pull data from a source-- | |||
193 | // either a block of memory containing the _entire_ vorbis stream, or a | |||
194 | // FILE * that you or it create, or possibly some other reading mechanism | |||
195 | // if you go modify the source to replace the FILE * case with some kind | |||
196 | // of callback to your code. (But if you don't support seeking, you may | |||
197 | // just want to go ahead and use pushdata.) | |||
198 | ||||
199 | #if !defined(STB_VORBIS_NO_STDIO) && !defined(STB_VORBIS_NO_INTEGER_CONVERSION) | |||
200 | extern int stb_vorbis_decode_filename(char *filename, int *channels, short **output); | |||
201 | #endif | |||
202 | extern int stb_vorbis_decode_memory(unsigned char *mem, int len, int *channels, short **output); | |||
203 | // decode an entire file and output the data interleaved into a malloc()ed | |||
204 | // buffer stored in *output. The return value is the number of samples | |||
205 | // decoded, or -1 if the file could not be opened or was not an ogg vorbis file. | |||
206 | // When you're done with it, just free() the pointer returned in *output. | |||
207 | ||||
208 | extern stb_vorbis * stb_vorbis_open_memory(unsigned char *data, int len, | |||
209 | int *error, stb_vorbis_alloc *alloc_buffer); | |||
210 | // create an ogg vorbis decoder from an ogg vorbis stream in memory (note | |||
211 | // this must be the entire stream!). on failure, returns NULL and sets *error | |||
212 | ||||
213 | #ifndef STB_VORBIS_NO_STDIO | |||
214 | extern stb_vorbis * stb_vorbis_open_filename(char *filename, | |||
215 | int *error, stb_vorbis_alloc *alloc_buffer); | |||
216 | // create an ogg vorbis decoder from a filename via fopen(). on failure, | |||
217 | // returns NULL and sets *error (possibly to VORBIS_file_open_failure). | |||
218 | ||||
219 | extern stb_vorbis * stb_vorbis_open_file(FILE *f, int close_handle_on_close, | |||
220 | int *error, stb_vorbis_alloc *alloc_buffer); | |||
221 | // create an ogg vorbis decoder from an open FILE *, looking for a stream at | |||
222 | // the _current_ seek point (ftell). on failure, returns NULL and sets *error. | |||
223 | // note that stb_vorbis must "own" this stream; if you seek it in between | |||
224 | // calls to stb_vorbis, it will become confused. Morever, if you attempt to | |||
225 | // perform stb_vorbis_seek_*() operations on this file, it will assume it | |||
226 | // owns the _entire_ rest of the file after the start point. Use the next | |||
227 | // function, stb_vorbis_open_file_section(), to limit it. | |||
228 | ||||
229 | extern stb_vorbis * stb_vorbis_open_file_section(FILE *f, int close_handle_on_close, | |||
230 | int *error, stb_vorbis_alloc *alloc_buffer, unsigned int len); | |||
231 | // create an ogg vorbis decoder from an open FILE *, looking for a stream at | |||
232 | // the _current_ seek point (ftell); the stream will be of length 'len' bytes. | |||
233 | // on failure, returns NULL and sets *error. note that stb_vorbis must "own" | |||
234 | // this stream; if you seek it in between calls to stb_vorbis, it will become | |||
235 | // confused. | |||
236 | #endif | |||
237 | ||||
238 | extern int stb_vorbis_seek_frame(stb_vorbis *f, unsigned int sample_number); | |||
239 | extern int stb_vorbis_seek(stb_vorbis *f, unsigned int sample_number); | |||
240 | // NOT WORKING YET | |||
241 | // these functions seek in the Vorbis file to (approximately) 'sample_number'. | |||
242 | // after calling seek_frame(), the next call to get_frame_*() will include | |||
243 | // the specified sample. after calling stb_vorbis_seek(), the next call to | |||
244 | // stb_vorbis_get_samples_* will start with the specified sample. If you | |||
245 | // do not need to seek to EXACTLY the target sample when using get_samples_*, | |||
246 | // you can also use seek_frame(). | |||
247 | ||||
248 | extern void stb_vorbis_seek_start(stb_vorbis *f); | |||
249 | // this function is equivalent to stb_vorbis_seek(f,0), but it | |||
250 | // actually works | |||
251 | ||||
252 | extern unsigned int stb_vorbis_stream_length_in_samples(stb_vorbis *f); | |||
253 | extern float stb_vorbis_stream_length_in_seconds(stb_vorbis *f); | |||
254 | // these functions return the total length of the vorbis stream | |||
255 | ||||
256 | extern int stb_vorbis_get_frame_float(stb_vorbis *f, int *channels, float ***output); | |||
257 | // decode the next frame and return the number of samples. the number of | |||
258 | // channels returned are stored in *channels (which can be NULL--it is always | |||
259 | // the same as the number of channels reported by get_info). *output will | |||
260 | // contain an array of float* buffers, one per channel. These outputs will | |||
261 | // be overwritten on the next call to stb_vorbis_get_frame_*. | |||
262 | // | |||
263 | // You generally should not intermix calls to stb_vorbis_get_frame_*() | |||
264 | // and stb_vorbis_get_samples_*(), since the latter calls the former. | |||
265 | ||||
266 | #ifndef STB_VORBIS_NO_INTEGER_CONVERSION | |||
267 | extern int stb_vorbis_get_frame_short_interleaved(stb_vorbis *f, int num_c, short *buffer, int num_shorts); | |||
268 | extern int stb_vorbis_get_frame_short (stb_vorbis *f, int num_c, short **buffer, int num_samples); | |||
269 | #endif | |||
270 | // decode the next frame and return the number of samples per channel. the | |||
271 | // data is coerced to the number of channels you request according to the | |||
272 | // channel coercion rules (see below). You must pass in the size of your | |||
273 | // buffer(s) so that stb_vorbis will not overwrite the end of the buffer. | |||
274 | // The maximum buffer size needed can be gotten from get_info(); however, | |||
275 | // the Vorbis I specification implies an absolute maximum of 4096 samples | |||
276 | // per channel. Note that for interleaved data, you pass in the number of | |||
277 | // shorts (the size of your array), but the return value is the number of | |||
278 | // samples per channel, not the total number of samples. | |||
279 | ||||
280 | // Channel coercion rules: | |||
281 | // Let M be the number of channels requested, and N the number of channels present, | |||
282 | // and Cn be the nth channel; let stereo L be the sum of all L and center channels, | |||
283 | // and stereo R be the sum of all R and center channels (channel assignment from the | |||
284 | // vorbis spec). | |||
285 | // M N output | |||
286 | // 1 k sum(Ck) for all k | |||
287 | // 2 * stereo L, stereo R | |||
288 | // k l k > l, the first l channels, then 0s | |||
289 | // k l k <= l, the first k channels | |||
290 | // Note that this is not _good_ surround etc. mixing at all! It's just so | |||
291 | // you get something useful. | |||
292 | ||||
293 | extern int stb_vorbis_get_samples_float_interleaved(stb_vorbis *f, int channels, float *buffer, int num_floats); | |||
294 | extern int stb_vorbis_get_samples_float(stb_vorbis *f, int channels, float **buffer, int num_samples); | |||
295 | // gets num_samples samples, not necessarily on a frame boundary--this requires | |||
296 | // buffering so you have to supply the buffers. DOES NOT APPLY THE COERCION RULES. | |||
297 | // Returns the number of samples stored per channel; it may be less than requested | |||
298 | // at the end of the file. If there are no more samples in the file, returns 0. | |||
299 | ||||
300 | #ifndef STB_VORBIS_NO_INTEGER_CONVERSION | |||
301 | extern int stb_vorbis_get_samples_short_interleaved(stb_vorbis *f, int channels, short *buffer, int num_shorts); | |||
302 | extern int stb_vorbis_get_samples_short(stb_vorbis *f, int channels, short **buffer, int num_samples); | |||
303 | #endif | |||
304 | // gets num_samples samples, not necessarily on a frame boundary--this requires | |||
305 | // buffering so you have to supply the buffers. Applies the coercion rules above | |||
306 | // to produce 'channels' channels. Returns the number of samples stored per channel; | |||
307 | // it may be less than requested at the end of the file. If there are no more | |||
308 | // samples in the file, returns 0. | |||
309 | ||||
310 | #endif | |||
311 | ||||
312 | //////// ERROR CODES | |||
313 | ||||
314 | enum STBVorbisError | |||
315 | { | |||
316 | VORBIS__no_error, | |||
317 | ||||
318 | VORBIS_need_more_data=1, // not a real error | |||
319 | ||||
320 | VORBIS_invalid_api_mixing, // can't mix API modes | |||
321 | VORBIS_outofmem, // not enough memory | |||
322 | VORBIS_feature_not_supported, // uses floor 0 | |||
323 | VORBIS_too_many_channels, // STB_VORBIS_MAX_CHANNELS is too small | |||
324 | VORBIS_file_open_failure, // fopen() failed | |||
325 | VORBIS_seek_without_length, // can't seek in unknown-length file | |||
326 | ||||
327 | VORBIS_unexpected_eof=10, // file is truncated? | |||
328 | VORBIS_seek_invalid, // seek past EOF | |||
329 | ||||
330 | // decoding errors (corrupt/invalid stream) -- you probably | |||
331 | // don't care about the exact details of these | |||
332 | ||||
333 | // vorbis errors: | |||
334 | VORBIS_invalid_setup=20, | |||
335 | VORBIS_invalid_stream, | |||
336 | ||||
337 | // ogg errors: | |||
338 | VORBIS_missing_capture_pattern=30, | |||
339 | VORBIS_invalid_stream_structure_version, | |||
340 | VORBIS_continued_packet_flag_invalid, | |||
341 | VORBIS_incorrect_stream_serial_number, | |||
342 | VORBIS_invalid_first_page, | |||
343 | VORBIS_bad_packet_type, | |||
344 | VORBIS_cant_find_last_page, | |||
345 | VORBIS_seek_failed, | |||
346 | }; | |||
347 | ||||
348 | ||||
349 | #ifdef __cplusplus | |||
350 | } | |||
351 | #endif | |||
352 | ||||
353 | #endif // STB_VORBIS_INCLUDE_STB_VORBIS_H | |||
354 | // | |||
355 | // HEADER ENDS HERE | |||
356 | // | |||
357 | ////////////////////////////////////////////////////////////////////////////// | |||
358 | ||||
359 | #ifndef STB_VORBIS_HEADER_ONLY | |||
360 | ||||
361 | // global configuration settings (e.g. set these in the project/makefile), | |||
362 | // or just set them in this file at the top (although ideally the first few | |||
363 | // should be visible when the header file is compiled too, although it's not | |||
364 | // crucial) | |||
365 | ||||
366 | // STB_VORBIS_NO_PUSHDATA_API | |||
367 | // does not compile the code for the various stb_vorbis_*_pushdata() | |||
368 | // functions | |||
369 | // #define STB_VORBIS_NO_PUSHDATA_API | |||
370 | ||||
371 | // STB_VORBIS_NO_PULLDATA_API | |||
372 | // does not compile the code for the non-pushdata APIs | |||
373 | // #define STB_VORBIS_NO_PULLDATA_API | |||
374 | ||||
375 | // STB_VORBIS_NO_STDIO | |||
376 | // does not compile the code for the APIs that use FILE *s internally | |||
377 | // or externally (implied by STB_VORBIS_NO_PULLDATA_API) | |||
378 | // #define STB_VORBIS_NO_STDIO | |||
379 | ||||
380 | // STB_VORBIS_NO_INTEGER_CONVERSION | |||
381 | // does not compile the code for converting audio sample data from | |||
382 | // float to integer (implied by STB_VORBIS_NO_PULLDATA_API) | |||
383 | // #define STB_VORBIS_NO_INTEGER_CONVERSION | |||
384 | ||||
385 | // STB_VORBIS_NO_FAST_SCALED_FLOAT | |||
386 | // does not use a fast float-to-int trick to accelerate float-to-int on | |||
387 | // most platforms which requires endianness be defined correctly. | |||
388 | //#define STB_VORBIS_NO_FAST_SCALED_FLOAT | |||
389 | ||||
390 | ||||
391 | // STB_VORBIS_MAX_CHANNELS [number] | |||
392 | // globally define this to the maximum number of channels you need. | |||
393 | // The spec does not put a restriction on channels except that | |||
394 | // the count is stored in a byte, so 255 is the hard limit. | |||
395 | // Reducing this saves about 16 bytes per value, so using 16 saves | |||
396 | // (255-16)*16 or around 4KB. Plus anything other memory usage | |||
397 | // I forgot to account for. Can probably go as low as 8 (7.1 audio), | |||
398 | // 6 (5.1 audio), or 2 (stereo only). | |||
399 | #ifndef STB_VORBIS_MAX_CHANNELS16 | |||
400 | #define STB_VORBIS_MAX_CHANNELS16 16 // enough for anyone? | |||
401 | #endif | |||
402 | ||||
403 | // STB_VORBIS_PUSHDATA_CRC_COUNT [number] | |||
404 | // after a flush_pushdata(), stb_vorbis begins scanning for the | |||
405 | // next valid page, without backtracking. when it finds something | |||
406 | // that looks like a page, it streams through it and verifies its | |||
407 | // CRC32. Should that validation fail, it keeps scanning. But it's | |||
408 | // possible that _while_ streaming through to check the CRC32 of | |||
409 | // one candidate page, it sees another candidate page. This #define | |||
410 | // determines how many "overlapping" candidate pages it can search | |||
411 | // at once. Note that "real" pages are typically ~4KB to ~8KB, whereas | |||
412 | // garbage pages could be as big as 64KB, but probably average ~16KB. | |||
413 | // So don't hose ourselves by scanning an apparent 64KB page and | |||
414 | // missing a ton of real ones in the interim; so minimum of 2 | |||
415 | #ifndef STB_VORBIS_PUSHDATA_CRC_COUNT4 | |||
416 | #define STB_VORBIS_PUSHDATA_CRC_COUNT4 4 | |||
417 | #endif | |||
418 | ||||
419 | // STB_VORBIS_FAST_HUFFMAN_LENGTH [number] | |||
420 | // sets the log size of the huffman-acceleration table. Maximum | |||
421 | // supported value is 24. with larger numbers, more decodings are O(1), | |||
422 | // but the table size is larger so worse cache missing, so you'll have | |||
423 | // to probe (and try multiple ogg vorbis files) to find the sweet spot. | |||
424 | #ifndef STB_VORBIS_FAST_HUFFMAN_LENGTH10 | |||
425 | #define STB_VORBIS_FAST_HUFFMAN_LENGTH10 10 | |||
426 | #endif | |||
427 | ||||
428 | // STB_VORBIS_FAST_BINARY_LENGTH [number] | |||
429 | // sets the log size of the binary-search acceleration table. this | |||
430 | // is used in similar fashion to the fast-huffman size to set initial | |||
431 | // parameters for the binary search | |||
432 | ||||
433 | // STB_VORBIS_FAST_HUFFMAN_INT | |||
434 | // The fast huffman tables are much more efficient if they can be | |||
435 | // stored as 16-bit results instead of 32-bit results. This restricts | |||
436 | // the codebooks to having only 65535 possible outcomes, though. | |||
437 | // (At least, accelerated by the huffman table.) | |||
438 | #ifndef STB_VORBIS_FAST_HUFFMAN_INT | |||
439 | #define STB_VORBIS_FAST_HUFFMAN_SHORT | |||
440 | #endif | |||
441 | ||||
442 | // STB_VORBIS_NO_HUFFMAN_BINARY_SEARCH | |||
443 | // If the 'fast huffman' search doesn't succeed, then stb_vorbis falls | |||
444 | // back on binary searching for the correct one. This requires storing | |||
445 | // extra tables with the huffman codes in sorted order. Defining this | |||
446 | // symbol trades off space for speed by forcing a linear search in the | |||
447 | // non-fast case, except for "sparse" codebooks. | |||
448 | // #define STB_VORBIS_NO_HUFFMAN_BINARY_SEARCH | |||
449 | ||||
450 | // STB_VORBIS_DIVIDES_IN_RESIDUE | |||
451 | // stb_vorbis precomputes the result of the scalar residue decoding | |||
452 | // that would otherwise require a divide per chunk. you can trade off | |||
453 | // space for time by defining this symbol. | |||
454 | // #define STB_VORBIS_DIVIDES_IN_RESIDUE | |||
455 | ||||
456 | // STB_VORBIS_DIVIDES_IN_CODEBOOK | |||
457 | // vorbis VQ codebooks can be encoded two ways: with every case explicitly | |||
458 | // stored, or with all elements being chosen from a small range of values, | |||
459 | // and all values possible in all elements. By default, stb_vorbis expands | |||
460 | // this latter kind out to look like the former kind for ease of decoding, | |||
461 | // because otherwise an integer divide-per-vector-element is required to | |||
462 | // unpack the index. If you define STB_VORBIS_DIVIDES_IN_CODEBOOK, you can | |||
463 | // trade off storage for speed. | |||
464 | //#define STB_VORBIS_DIVIDES_IN_CODEBOOK | |||
465 | ||||
466 | // STB_VORBIS_CODEBOOK_SHORTS | |||
467 | // The vorbis file format encodes VQ codebook floats as ax+b where a and | |||
468 | // b are floating point per-codebook constants, and x is a 16-bit int. | |||
469 | // Normally, stb_vorbis decodes them to floats rather than leaving them | |||
470 | // as 16-bit ints and computing ax+b while decoding. This is a speed/space | |||
471 | // tradeoff; you can save space by defining this flag. | |||
472 | #ifndef STB_VORBIS_CODEBOOK_SHORTS | |||
473 | #define STB_VORBIS_CODEBOOK_FLOATS | |||
474 | #endif | |||
475 | ||||
476 | // STB_VORBIS_DIVIDE_TABLE | |||
477 | // this replaces small integer divides in the floor decode loop with | |||
478 | // table lookups. made less than 1% difference, so disabled by default. | |||
479 | ||||
480 | // STB_VORBIS_NO_INLINE_DECODE | |||
481 | // disables the inlining of the scalar codebook fast-huffman decode. | |||
482 | // might save a little codespace; useful for debugging | |||
483 | // #define STB_VORBIS_NO_INLINE_DECODE | |||
484 | ||||
485 | // STB_VORBIS_NO_DEFER_FLOOR | |||
486 | // Normally we only decode the floor without synthesizing the actual | |||
487 | // full curve. We can instead synthesize the curve immediately. This | |||
488 | // requires more memory and is very likely slower, so I don't think | |||
489 | // you'd ever want to do it except for debugging. | |||
490 | // #define STB_VORBIS_NO_DEFER_FLOOR | |||
491 | ||||
492 | ||||
493 | ||||
494 | ||||
495 | ////////////////////////////////////////////////////////////////////////////// | |||
496 | ||||
497 | #ifdef STB_VORBIS_NO_PULLDATA_API | |||
498 | #define STB_VORBIS_NO_INTEGER_CONVERSION | |||
499 | #define STB_VORBIS_NO_STDIO | |||
500 | #endif | |||
501 | ||||
502 | #if defined(STB_VORBIS_NO_CRT) && !defined(STB_VORBIS_NO_STDIO) | |||
503 | #define STB_VORBIS_NO_STDIO 1 | |||
504 | #endif | |||
505 | ||||
506 | #ifndef STB_VORBIS_NO_INTEGER_CONVERSION | |||
507 | #ifndef STB_VORBIS_NO_FAST_SCALED_FLOAT | |||
508 | ||||
509 | // only need endianness for fast-float-to-int, which we don't | |||
510 | // use for pushdata | |||
511 | ||||
512 | #ifndef STB_VORBIS_BIG_ENDIAN | |||
513 | #define STB_VORBIS_ENDIAN0 0 | |||
514 | #else | |||
515 | #define STB_VORBIS_ENDIAN0 1 | |||
516 | #endif | |||
517 | ||||
518 | #endif | |||
519 | #endif | |||
520 | ||||
521 | ||||
522 | #ifndef STB_VORBIS_NO_STDIO | |||
523 | #include <stdio.h> | |||
524 | #endif | |||
525 | ||||
526 | #ifndef STB_VORBIS_NO_CRT | |||
527 | #include <stdlib.h> | |||
528 | #include <string.h> | |||
529 | #include <assert.h> | |||
530 | #include <math.h> | |||
531 | #else | |||
532 | #define NULL((void*)0) 0 | |||
533 | #endif | |||
534 | ||||
535 | #ifndef _MSC_VER | |||
536 | #if __GNUC__4 | |||
537 | #define __forceinlineinline inline | |||
538 | #else | |||
539 | #define __forceinlineinline | |||
540 | #endif | |||
541 | #endif | |||
542 | ||||
543 | #if STB_VORBIS_MAX_CHANNELS16 > 256 | |||
544 | #error "Value of STB_VORBIS_MAX_CHANNELS outside of allowed range" | |||
545 | #endif | |||
546 | ||||
547 | #if STB_VORBIS_FAST_HUFFMAN_LENGTH10 > 24 | |||
548 | #error "Value of STB_VORBIS_FAST_HUFFMAN_LENGTH outside of allowed range" | |||
549 | #endif | |||
550 | ||||
551 | ||||
552 | #define MAX_BLOCKSIZE_LOG13 13 // from specification | |||
553 | #define MAX_BLOCKSIZE(1 << 13) (1 << MAX_BLOCKSIZE_LOG13) | |||
554 | ||||
555 | ||||
556 | typedef unsigned char uint8; | |||
557 | typedef signed char int8; | |||
558 | typedef unsigned short uint16; | |||
559 | typedef signed short int16; | |||
560 | typedef unsigned int uint32; | |||
561 | typedef signed int int32; | |||
562 | ||||
563 | #ifndef TRUE1 | |||
564 | #define TRUE1 1 | |||
565 | #define FALSE0 0 | |||
566 | #endif | |||
567 | ||||
568 | #ifdef STB_VORBIS_CODEBOOK_FLOATS | |||
569 | typedef float codetype; | |||
570 | #else | |||
571 | typedef uint16 codetype; | |||
572 | #endif | |||
573 | ||||
574 | // @NOTE | |||
575 | // | |||
576 | // Some arrays below are tagged "//varies", which means it's actually | |||
577 | // a variable-sized piece of data, but rather than malloc I assume it's | |||
578 | // small enough it's better to just allocate it all together with the | |||
579 | // main thing | |||
580 | // | |||
581 | // Most of the variables are specified with the smallest size I could pack | |||
582 | // them into. It might give better performance to make them all full-sized | |||
583 | // integers. It should be safe to freely rearrange the structures or change | |||
584 | // the sizes larger--nothing relies on silently truncating etc., nor the | |||
585 | // order of variables. | |||
586 | ||||
587 | #define FAST_HUFFMAN_TABLE_SIZE(1 << 10) (1 << STB_VORBIS_FAST_HUFFMAN_LENGTH10) | |||
588 | #define FAST_HUFFMAN_TABLE_MASK((1 << 10) - 1) (FAST_HUFFMAN_TABLE_SIZE(1 << 10) - 1) | |||
589 | ||||
590 | typedef struct | |||
591 | { | |||
592 | int dimensions, entries; | |||
593 | uint8 *codeword_lengths; | |||
594 | float minimum_value; | |||
595 | float delta_value; | |||
596 | uint8 value_bits; | |||
597 | uint8 lookup_type; | |||
598 | uint8 sequence_p; | |||
599 | uint8 sparse; | |||
600 | uint32 lookup_values; | |||
601 | codetype *multiplicands; | |||
602 | uint32 *codewords; | |||
603 | #ifdef STB_VORBIS_FAST_HUFFMAN_SHORT | |||
604 | int16 fast_huffman[FAST_HUFFMAN_TABLE_SIZE(1 << 10)]; | |||
605 | #else | |||
606 | int32 fast_huffman[FAST_HUFFMAN_TABLE_SIZE(1 << 10)]; | |||
607 | #endif | |||
608 | uint32 *sorted_codewords; | |||
609 | int *sorted_values; | |||
610 | int sorted_entries; | |||
611 | } Codebook; | |||
612 | ||||
613 | typedef struct | |||
614 | { | |||
615 | uint8 order; | |||
616 | uint16 rate; | |||
617 | uint16 bark_map_size; | |||
618 | uint8 amplitude_bits; | |||
619 | uint8 amplitude_offset; | |||
620 | uint8 number_of_books; | |||
621 | uint8 book_list[16]; // varies | |||
622 | } Floor0; | |||
623 | ||||
624 | typedef struct | |||
625 | { | |||
626 | uint8 partitions; | |||
627 | uint8 partition_class_list[32]; // varies | |||
628 | uint8 class_dimensions[16]; // varies | |||
629 | uint8 class_subclasses[16]; // varies | |||
630 | uint8 class_masterbooks[16]; // varies | |||
631 | int16 subclass_books[16][8]; // varies | |||
632 | uint16 Xlist[31*8+2]; // varies | |||
633 | uint8 sorted_order[31*8+2]; | |||
634 | uint8 neighbors[31*8+2][2]; | |||
635 | uint8 floor1_multiplier; | |||
636 | uint8 rangebits; | |||
637 | int values; | |||
638 | } Floor1; | |||
639 | ||||
640 | typedef union | |||
641 | { | |||
642 | Floor0 floor0; | |||
643 | Floor1 floor1; | |||
644 | } Floor; | |||
645 | ||||
646 | typedef struct | |||
647 | { | |||
648 | uint32 begin, end; | |||
649 | uint32 part_size; | |||
650 | uint8 classifications; | |||
651 | uint8 classbook; | |||
652 | uint8 **classdata; | |||
653 | int16 (*residue_books)[8]; | |||
654 | } Residue; | |||
655 | ||||
656 | typedef struct | |||
657 | { | |||
658 | uint8 magnitude; | |||
659 | uint8 angle; | |||
660 | uint8 mux; | |||
661 | } MappingChannel; | |||
662 | ||||
663 | typedef struct | |||
664 | { | |||
665 | uint16 coupling_steps; | |||
666 | MappingChannel *chan; | |||
667 | uint8 submaps; | |||
668 | uint8 submap_floor[15]; // varies | |||
669 | uint8 submap_residue[15]; // varies | |||
670 | } Mapping; | |||
671 | ||||
672 | typedef struct | |||
673 | { | |||
674 | uint8 blockflag; | |||
675 | uint8 mapping; | |||
676 | uint16 windowtype; | |||
677 | uint16 transformtype; | |||
678 | } Mode; | |||
679 | ||||
680 | typedef struct | |||
681 | { | |||
682 | uint32 goal_crc; // expected crc if match | |||
683 | int bytes_left; // bytes left in packet | |||
684 | uint32 crc_so_far; // running crc | |||
685 | int bytes_done; // bytes processed in _current_ chunk | |||
686 | uint32 sample_loc; // granule pos encoded in page | |||
687 | } CRCscan; | |||
688 | ||||
689 | typedef struct | |||
690 | { | |||
691 | uint32 page_start, page_end; | |||
692 | uint32 after_previous_page_start; | |||
693 | uint32 first_decoded_sample; | |||
694 | uint32 last_decoded_sample; | |||
695 | } ProbedPage; | |||
696 | ||||
697 | struct stb_vorbis | |||
698 | { | |||
699 | // user-accessible info | |||
700 | unsigned int sample_rate; | |||
701 | int channels; | |||
702 | ||||
703 | unsigned int setup_memory_required; | |||
704 | unsigned int temp_memory_required; | |||
705 | unsigned int setup_temp_memory_required; | |||
706 | ||||
707 | // input config | |||
708 | #ifndef STB_VORBIS_NO_STDIO | |||
709 | FILE *f; | |||
710 | uint32 f_start; | |||
711 | int close_on_free; | |||
712 | #endif | |||
713 | ||||
714 | uint8 *stream; | |||
715 | uint8 *stream_start; | |||
716 | uint8 *stream_end; | |||
717 | ||||
718 | uint32 stream_len; | |||
719 | ||||
720 | uint8 push_mode; | |||
721 | ||||
722 | uint32 first_audio_page_offset; | |||
723 | ||||
724 | ProbedPage p_first, p_last; | |||
725 | ||||
726 | // memory management | |||
727 | stb_vorbis_alloc alloc; | |||
728 | int setup_offset; | |||
729 | int temp_offset; | |||
730 | ||||
731 | // run-time results | |||
732 | int eof; | |||
733 | enum STBVorbisError error; | |||
734 | ||||
735 | // user-useful data | |||
736 | ||||
737 | // header info | |||
738 | int blocksize[2]; | |||
739 | int blocksize_0, blocksize_1; | |||
740 | int codebook_count; | |||
741 | Codebook *codebooks; | |||
742 | int floor_count; | |||
743 | uint16 floor_types[64]; // varies | |||
744 | Floor *floor_config; | |||
745 | int residue_count; | |||
746 | uint16 residue_types[64]; // varies | |||
747 | Residue *residue_config; | |||
748 | int mapping_count; | |||
749 | Mapping *mapping; | |||
750 | int mode_count; | |||
751 | Mode mode_config[64]; // varies | |||
752 | ||||
753 | uint32 total_samples; | |||
754 | ||||
755 | // decode buffer | |||
756 | float *channel_buffers[STB_VORBIS_MAX_CHANNELS16]; | |||
757 | float *outputs [STB_VORBIS_MAX_CHANNELS16]; | |||
758 | ||||
759 | float *previous_window[STB_VORBIS_MAX_CHANNELS16]; | |||
760 | int previous_length; | |||
761 | ||||
762 | #ifndef STB_VORBIS_NO_DEFER_FLOOR | |||
763 | int16 *finalY[STB_VORBIS_MAX_CHANNELS16]; | |||
764 | #else | |||
765 | float *floor_buffers[STB_VORBIS_MAX_CHANNELS16]; | |||
766 | #endif | |||
767 | ||||
768 | uint32 current_loc; // sample location of next frame to decode | |||
769 | int current_loc_valid; | |||
770 | ||||
771 | // per-blocksize precomputed data | |||
772 | ||||
773 | // twiddle factors | |||
774 | float *A[2],*B[2],*C(2 | 4 | 1)[2]; | |||
775 | float *window[2]; | |||
776 | uint16 *bit_reverse[2]; | |||
777 | ||||
778 | // current page/packet/segment streaming info | |||
779 | uint32 serial; // stream serial number for verification | |||
780 | int last_page; | |||
781 | int segment_count; | |||
782 | uint8 segments[255]; | |||
783 | uint8 page_flag; | |||
784 | uint8 bytes_in_seg; | |||
785 | uint8 first_decode; | |||
786 | int next_seg; | |||
787 | int last_seg; // flag that we're on the last segment | |||
788 | int last_seg_which; // what was the segment number of the last seg? | |||
789 | uint32 acc; | |||
790 | int valid_bits; | |||
791 | int packet_bytes; | |||
792 | int end_seg_with_known_loc; | |||
793 | uint32 known_loc_for_packet; | |||
794 | int discard_samples_deferred; | |||
795 | uint32 samples_output; | |||
796 | ||||
797 | // push mode scanning | |||
798 | int page_crc_tests; // only in push_mode: number of tests active; -1 if not searching | |||
799 | #ifndef STB_VORBIS_NO_PUSHDATA_API | |||
800 | CRCscan scan[STB_VORBIS_PUSHDATA_CRC_COUNT4]; | |||
801 | #endif | |||
802 | ||||
803 | // sample-access | |||
804 | int channel_buffer_start; | |||
805 | int channel_buffer_end; | |||
806 | }; | |||
807 | ||||
808 | extern int my_prof(int slot); | |||
809 | //#define stb_prof my_prof | |||
810 | ||||
811 | #ifndef stb_prof | |||
812 | #define stb_prof(x)(void)0 (void)0 | |||
813 | #endif | |||
814 | ||||
815 | #if defined(STB_VORBIS_NO_PUSHDATA_API) | |||
816 | #define IS_PUSH_MODE(f)((f)->push_mode) FALSE0 | |||
817 | #elif defined(STB_VORBIS_NO_PULLDATA_API) | |||
818 | #define IS_PUSH_MODE(f)((f)->push_mode) TRUE1 | |||
819 | #else | |||
820 | #define IS_PUSH_MODE(f)((f)->push_mode) ((f)->push_mode) | |||
821 | #endif | |||
822 | ||||
823 | typedef struct stb_vorbis vorb; | |||
824 | ||||
825 | static int error(vorb *f, enum STBVorbisError e) | |||
826 | { | |||
827 | f->error = e; | |||
828 | if (!f->eof && e != VORBIS_need_more_data) { | |||
829 | f->error=e; // breakpoint for debugging | |||
830 | } | |||
831 | return 0; | |||
832 | } | |||
833 | ||||
834 | ||||
835 | // these functions are used for allocating temporary memory | |||
836 | // while decoding. if you can afford the stack space, use | |||
837 | // alloca(); otherwise, provide a temp buffer and it will | |||
838 | // allocate out of those. | |||
839 | ||||
840 | #define array_size_required(count,size)(count*(sizeof(void *)+(size))) (count*(sizeof(void *)+(size))) | |||
841 | ||||
842 | #define temp_alloc(f,size)(f->alloc.alloc_buffer ? setup_temp_malloc(f,size) : alloca (size)) (f->alloc.alloc_buffer ? setup_temp_malloc(f,size) : alloca(size)) | |||
843 | #ifdef dealloca | |||
844 | #define temp_free(f,p)0 (f->alloc.alloc_buffer ? 0 : dealloca(size)) | |||
845 | #else | |||
846 | #define temp_free(f,p)0 0 | |||
847 | #endif | |||
848 | #define temp_alloc_save(f)((f)->temp_offset) ((f)->temp_offset) | |||
849 | #define temp_alloc_restore(f,p)((f)->temp_offset = (p)) ((f)->temp_offset = (p)) | |||
850 | ||||
851 | #define temp_block_array(f,count,size)make_block_array((f->alloc.alloc_buffer ? setup_temp_malloc (f,(count*(sizeof(void *)+(size)))) : alloca((count*(sizeof(void *)+(size))))), count, size) make_block_array(temp_alloc(f,array_size_required(count,size))(f->alloc.alloc_buffer ? setup_temp_malloc(f,(count*(sizeof (void *)+(size)))) : alloca((count*(sizeof(void *)+(size))))), count, size) | |||
852 | ||||
853 | // given a sufficiently large block of memory, make an array of pointers to subblocks of it | |||
854 | static void *make_block_array(void *mem, int count, int size) | |||
855 | { | |||
856 | int i; | |||
857 | void ** p = (void **) mem; | |||
858 | char *q = (char *) (p + count); | |||
859 | for (i=0; i < count; ++i) { | |||
860 | p[i] = q; | |||
861 | q += size; | |||
862 | } | |||
863 | return p; | |||
864 | } | |||
865 | ||||
866 | static void *setup_malloc(vorb *f, int sz) | |||
867 | { | |||
868 | sz = (sz+3) & ~3; | |||
869 | f->setup_memory_required += sz; | |||
870 | if (f->alloc.alloc_buffer) { | |||
871 | void *p = (char *) f->alloc.alloc_buffer + f->setup_offset; | |||
872 | if (f->setup_offset + sz > f->temp_offset) return NULL((void*)0); | |||
873 | f->setup_offset += sz; | |||
874 | return p; | |||
875 | } | |||
876 | return sz ? malloc(sz) : NULL((void*)0); | |||
877 | } | |||
878 | ||||
879 | static void setup_free(vorb *f, void *p) | |||
880 | { | |||
881 | if (f->alloc.alloc_buffer) return; // do nothing; setup mem is not a stack | |||
882 | free(p); | |||
883 | } | |||
884 | ||||
885 | static void *setup_temp_malloc(vorb *f, int sz) | |||
886 | { | |||
887 | sz = (sz+3) & ~3; | |||
888 | if (f->alloc.alloc_buffer) { | |||
889 | if (f->temp_offset - sz < f->setup_offset) return NULL((void*)0); | |||
890 | f->temp_offset -= sz; | |||
891 | return (char *) f->alloc.alloc_buffer + f->temp_offset; | |||
892 | } | |||
893 | return malloc(sz); | |||
894 | } | |||
895 | ||||
896 | static void setup_temp_free(vorb *f, void *p, size_t sz) | |||
897 | { | |||
898 | if (f->alloc.alloc_buffer) { | |||
899 | f->temp_offset += (sz+3)&~3; | |||
900 | return; | |||
901 | } | |||
902 | free(p); | |||
903 | } | |||
904 | ||||
905 | #define CRC32_POLY0x04c11db7 0x04c11db7 // from spec | |||
906 | ||||
907 | static uint32 crc_table[256]; | |||
908 | static void crc32_init(void) | |||
909 | { | |||
910 | int i,j; | |||
911 | uint32 s; | |||
912 | for(i=0; i < 256; i++) { | |||
913 | for (s=i<<24, j=0; j < 8; ++j) | |||
914 | s = (s << 1) ^ (s >= (1<<31) ? CRC32_POLY0x04c11db7 : 0); | |||
915 | crc_table[i] = s; | |||
916 | } | |||
917 | } | |||
918 | ||||
919 | static __forceinlineinline uint32 crc32_update(uint32 crc, uint8 byte) | |||
920 | { | |||
921 | return (crc << 8) ^ crc_table[byte ^ (crc >> 24)]; | |||
922 | } | |||
923 | ||||
924 | ||||
925 | // used in setup, and for huffman that doesn't go fast path | |||
926 | static unsigned int bit_reverse(unsigned int n) | |||
927 | { | |||
928 | n = ((n & 0xAAAAAAAA) >> 1) | ((n & 0x55555555) << 1); | |||
929 | n = ((n & 0xCCCCCCCC) >> 2) | ((n & 0x33333333) << 2); | |||
930 | n = ((n & 0xF0F0F0F0) >> 4) | ((n & 0x0F0F0F0F) << 4); | |||
931 | n = ((n & 0xFF00FF00) >> 8) | ((n & 0x00FF00FF) << 8); | |||
932 | return (n >> 16) | (n << 16); | |||
933 | } | |||
934 | ||||
935 | static float square(float x) | |||
936 | { | |||
937 | return x*x; | |||
938 | } | |||
939 | ||||
940 | // this is a weird definition of log2() for which log2(1) = 1, log2(2) = 2, log2(4) = 3 | |||
941 | // as required by the specification. fast(?) implementation from stb.h | |||
942 | // @OPTIMIZE: called multiple times per-packet with "constants"; move to setup | |||
943 | static int ilog(int32 n) | |||
944 | { | |||
945 | static signed char log2_4[16] = { 0,1,2,2,3,3,3,3,4,4,4,4,4,4,4,4 }; | |||
946 | ||||
947 | // 2 compares if n < 16, 3 compares otherwise (4 if signed or n > 1<<29) | |||
948 | if (n < (1U << 14)) | |||
949 | if (n < (1U << 4)) return 0 + log2_4[n ]; | |||
950 | else if (n < (1U << 9)) return 5 + log2_4[n >> 5]; | |||
951 | else return 10 + log2_4[n >> 10]; | |||
952 | else if (n < (1U << 24)) | |||
953 | if (n < (1U << 19)) return 15 + log2_4[n >> 15]; | |||
954 | else return 20 + log2_4[n >> 20]; | |||
955 | else if (n < (1U << 29)) return 25 + log2_4[n >> 25]; | |||
956 | else if (n < (1U << 31)) return 30 + log2_4[n >> 30]; | |||
957 | else return 0; // signed n returns 0 | |||
958 | } | |||
959 | ||||
960 | #ifndef M_PI3.14159265358979323846 | |||
961 | #define M_PI3.14159265358979323846 3.14159265358979323846264f // from CRC | |||
962 | #endif | |||
963 | ||||
964 | // code length assigned to a value with no huffman encoding | |||
965 | #define NO_CODE255 255 | |||
966 | ||||
967 | /////////////////////// LEAF SETUP FUNCTIONS ////////////////////////// | |||
968 | // | |||
969 | // these functions are only called at setup, and only a few times | |||
970 | // per file | |||
971 | ||||
972 | static float float32_unpack(uint32 x) | |||
973 | { | |||
974 | // from the specification | |||
975 | uint32 mantissa = x & 0x1fffff; | |||
976 | uint32 sign = x & 0x80000000; | |||
977 | uint32 exp = (x & 0x7fe00000) >> 21; | |||
978 | double res = sign ? -(double)mantissa : (double)mantissa; | |||
979 | return (float) ldexp((float)res, exp-788); | |||
980 | } | |||
981 | ||||
982 | ||||
983 | // zlib & jpeg huffman tables assume that the output symbols | |||
984 | // can either be arbitrarily arranged, or have monotonically | |||
985 | // increasing frequencies--they rely on the lengths being sorted; | |||
986 | // this makes for a very simple generation algorithm. | |||
987 | // vorbis allows a huffman table with non-sorted lengths. This | |||
988 | // requires a more sophisticated construction, since symbols in | |||
989 | // order do not map to huffman codes "in order". | |||
990 | static void add_entry(Codebook *c, uint32 huff_code, int symbol, int count, int len, uint32 *values) | |||
991 | { | |||
992 | if (!c->sparse) { | |||
993 | c->codewords [symbol] = huff_code; | |||
994 | } else { | |||
995 | c->codewords [count] = huff_code; | |||
996 | c->codeword_lengths[count] = len; | |||
997 | values [count] = symbol; | |||
998 | } | |||
999 | } | |||
1000 | ||||
1001 | static int compute_codewords(Codebook *c, uint8 *len, int n, uint32 *values) | |||
1002 | { | |||
1003 | int i,k,m=0; | |||
1004 | uint32 available[32]; | |||
1005 | ||||
1006 | memset(available, 0, sizeof(available)); | |||
1007 | // find the first entry | |||
1008 | for (k=0; k < n; ++k) if (len[k] < NO_CODE255) break; | |||
1009 | if (k == n) { assert(c->sorted_entries == 0)((c->sorted_entries == 0) ? (void)0 : _assert("c->sorted_entries == 0" , "src/siege/internal/stb/stb_vorbis.c", 1009)); return TRUE1; } | |||
1010 | // add to the list | |||
1011 | add_entry(c, 0, k, m++, len[k], values); | |||
1012 | // add all available leaves | |||
1013 | for (i=1; i <= len[k]; ++i) | |||
1014 | available[i] = 1 << (32-i); | |||
1015 | // note that the above code treats the first case specially, | |||
1016 | // but it's really the same as the following code, so they | |||
1017 | // could probably be combined (except the initial code is 0, | |||
1018 | // and I use 0 in available[] to mean 'empty') | |||
1019 | for (i=k+1; i < n; ++i) { | |||
1020 | uint32 res; | |||
1021 | int z = len[i], y; | |||
1022 | if (z == NO_CODE255) continue; | |||
1023 | // find lowest available leaf (should always be earliest, | |||
1024 | // which is what the specification calls for) | |||
1025 | // note that this property, and the fact we can never have | |||
1026 | // more than one free leaf at a given level, isn't totally | |||
1027 | // trivial to prove, but it seems true and the assert never | |||
1028 | // fires, so! | |||
1029 | while (z > 0 && !available[z]) --z; | |||
1030 | if (z == 0) { assert(0)((0) ? (void)0 : _assert("0", "src/siege/internal/stb/stb_vorbis.c" , 1030)); return FALSE0; } | |||
1031 | res = available[z]; | |||
1032 | available[z] = 0; | |||
1033 | add_entry(c, bit_reverse(res), i, m++, len[i], values); | |||
1034 | // propogate availability up the tree | |||
1035 | if (z != len[i]) { | |||
1036 | for (y=len[i]; y > z; --y) { | |||
1037 | assert(available[y] == 0)((available[y] == 0) ? (void)0 : _assert("available[y] == 0", "src/siege/internal/stb/stb_vorbis.c", 1037)); | |||
1038 | available[y] = res + (1 << (32-y)); | |||
1039 | } | |||
1040 | } | |||
1041 | } | |||
1042 | return TRUE1; | |||
1043 | } | |||
1044 | ||||
1045 | // accelerated huffman table allows fast O(1) match of all symbols | |||
1046 | // of length <= STB_VORBIS_FAST_HUFFMAN_LENGTH | |||
1047 | static void compute_accelerated_huffman(Codebook *c) | |||
1048 | { | |||
1049 | int i, len; | |||
1050 | for (i=0; i < FAST_HUFFMAN_TABLE_SIZE(1 << 10); ++i) | |||
1051 | c->fast_huffman[i] = -1; | |||
1052 | ||||
1053 | len = c->sparse ? c->sorted_entries : c->entries; | |||
1054 | #ifdef STB_VORBIS_FAST_HUFFMAN_SHORT | |||
1055 | if (len > 32767) len = 32767; // largest possible value we can encode! | |||
1056 | #endif | |||
1057 | for (i=0; i < len; ++i) { | |||
1058 | if (c->codeword_lengths[i] <= STB_VORBIS_FAST_HUFFMAN_LENGTH10) { | |||
1059 | uint32 z = c->sparse ? bit_reverse(c->sorted_codewords[i]) : c->codewords[i]; | |||
1060 | // set table entries for all bit combinations in the higher bits | |||
1061 | while (z < FAST_HUFFMAN_TABLE_SIZE(1 << 10)) { | |||
1062 | c->fast_huffman[z] = i; | |||
1063 | z += 1 << c->codeword_lengths[i]; | |||
1064 | } | |||
1065 | } | |||
1066 | } | |||
1067 | } | |||
1068 | ||||
1069 | static int uint32_compare(const void *p, const void *q) | |||
1070 | { | |||
1071 | uint32 x = * (uint32 *) p; | |||
1072 | uint32 y = * (uint32 *) q; | |||
1073 | return x < y ? -1 : x > y; | |||
1074 | } | |||
1075 | ||||
1076 | static int include_in_sort(Codebook *c, uint8 len) | |||
1077 | { | |||
1078 | if (c->sparse) { assert(len != NO_CODE)((len != 255) ? (void)0 : _assert("len != NO_CODE", "src/siege/internal/stb/stb_vorbis.c" , 1078)); return TRUE1; } | |||
1079 | if (len == NO_CODE255) return FALSE0; | |||
1080 | if (len > STB_VORBIS_FAST_HUFFMAN_LENGTH10) return TRUE1; | |||
1081 | return FALSE0; | |||
1082 | } | |||
1083 | ||||
1084 | // if the fast table above doesn't work, we want to binary | |||
1085 | // search them... need to reverse the bits | |||
1086 | static void compute_sorted_huffman(Codebook *c, uint8 *lengths, uint32 *values) | |||
1087 | { | |||
1088 | int i, len; | |||
1089 | // build a list of all the entries | |||
1090 | // OPTIMIZATION: don't include the short ones, since they'll be caught by FAST_HUFFMAN. | |||
1091 | // this is kind of a frivolous optimization--I don't see any performance improvement, | |||
1092 | // but it's like 4 extra lines of code, so. | |||
1093 | if (!c->sparse) { | |||
1094 | int k = 0; | |||
1095 | for (i=0; i < c->entries; ++i) | |||
1096 | if (include_in_sort(c, lengths[i])) | |||
1097 | c->sorted_codewords[k++] = bit_reverse(c->codewords[i]); | |||
1098 | assert(k == c->sorted_entries)((k == c->sorted_entries) ? (void)0 : _assert("k == c->sorted_entries" , "src/siege/internal/stb/stb_vorbis.c", 1098)); | |||
1099 | } else { | |||
1100 | for (i=0; i < c->sorted_entries; ++i) | |||
1101 | c->sorted_codewords[i] = bit_reverse(c->codewords[i]); | |||
1102 | } | |||
1103 | ||||
1104 | qsort(c->sorted_codewords, c->sorted_entries, sizeof(c->sorted_codewords[0]), uint32_compare); | |||
1105 | c->sorted_codewords[c->sorted_entries] = 0xffffffff; | |||
1106 | ||||
1107 | len = c->sparse ? c->sorted_entries : c->entries; | |||
1108 | // now we need to indicate how they correspond; we could either | |||
1109 | // #1: sort a different data structure that says who they correspond to | |||
1110 | // #2: for each sorted entry, search the original list to find who corresponds | |||
1111 | // #3: for each original entry, find the sorted entry | |||
1112 | // #1 requires extra storage, #2 is slow, #3 can use binary search! | |||
1113 | for (i=0; i < len; ++i) { | |||
1114 | int huff_len = c->sparse ? lengths[values[i]] : lengths[i]; | |||
1115 | if (include_in_sort(c,huff_len)) { | |||
1116 | uint32 code = bit_reverse(c->codewords[i]); | |||
1117 | int x=0, n=c->sorted_entries; | |||
1118 | while (n > 1) { | |||
1119 | // invariant: sc[x] <= code < sc[x+n] | |||
1120 | int m = x + (n >> 1); | |||
1121 | if (c->sorted_codewords[m] <= code) { | |||
1122 | x = m; | |||
1123 | n -= (n>>1); | |||
1124 | } else { | |||
1125 | n >>= 1; | |||
1126 | } | |||
1127 | } | |||
1128 | assert(c->sorted_codewords[x] == code)((c->sorted_codewords[x] == code) ? (void)0 : _assert("c->sorted_codewords[x] == code" , "src/siege/internal/stb/stb_vorbis.c", 1128)); | |||
1129 | if (c->sparse) { | |||
1130 | c->sorted_values[x] = values[i]; | |||
1131 | c->codeword_lengths[x] = huff_len; | |||
1132 | } else { | |||
1133 | c->sorted_values[x] = i; | |||
1134 | } | |||
1135 | } | |||
1136 | } | |||
1137 | } | |||
1138 | ||||
1139 | // only run while parsing the header (3 times) | |||
1140 | static int vorbis_validate(uint8 *data) | |||
1141 | { | |||
1142 | static uint8 vorbis[6] = { 'v', 'o', 'r', 'b', 'i', 's' }; | |||
1143 | return memcmp(data, vorbis, 6) == 0; | |||
1144 | } | |||
1145 | ||||
1146 | // called from setup only, once per code book | |||
1147 | // (formula implied by specification) | |||
1148 | static int lookup1_values(int entries, int dim) | |||
1149 | { | |||
1150 | int r = (int) floor(exp((float) log((float) entries) / dim)); | |||
1151 | if ((int) floor(pow((float) r+1, dim)) <= entries) // (int) cast for MinGW warning; | |||
1152 | ++r; // floor() to avoid _ftol() when non-CRT | |||
1153 | assert(pow((float) r+1, dim) > entries)((pow((float) r+1, dim) > entries) ? (void)0 : _assert("pow((float) r+1, dim) > entries" , "src/siege/internal/stb/stb_vorbis.c", 1153)); | |||
1154 | assert((int) floor(pow((float) r, dim)) <= entries)(((int) floor(pow((float) r, dim)) <= entries) ? (void)0 : _assert("(int) floor(pow((float) r, dim)) <= entries", "src/siege/internal/stb/stb_vorbis.c" , 1154)); // (int),floor() as above | |||
1155 | return r; | |||
1156 | } | |||
1157 | ||||
1158 | // called twice per file | |||
1159 | static void compute_twiddle_factors(int n, float *A, float *B, float *C(2 | 4 | 1)) | |||
1160 | { | |||
1161 | int n4 = n >> 2, n8 = n >> 3; | |||
1162 | int k,k2; | |||
1163 | ||||
1164 | for (k=k2=0; k < n4; ++k,k2+=2) { | |||
1165 | A[k2 ] = (float) cos(4*k*M_PI3.14159265358979323846/n); | |||
1166 | A[k2+1] = (float) -sin(4*k*M_PI3.14159265358979323846/n); | |||
1167 | B[k2 ] = (float) cos((k2+1)*M_PI3.14159265358979323846/n/2) * 0.5f; | |||
1168 | B[k2+1] = (float) sin((k2+1)*M_PI3.14159265358979323846/n/2) * 0.5f; | |||
1169 | } | |||
1170 | for (k=k2=0; k < n8; ++k,k2+=2) { | |||
1171 | C(2 | 4 | 1)[k2 ] = (float) cos(2*(k2+1)*M_PI3.14159265358979323846/n); | |||
1172 | C(2 | 4 | 1)[k2+1] = (float) -sin(2*(k2+1)*M_PI3.14159265358979323846/n); | |||
1173 | } | |||
1174 | } | |||
1175 | ||||
1176 | static void compute_window(int n, float *window) | |||
1177 | { | |||
1178 | int n2 = n >> 1, i; | |||
1179 | for (i=0; i < n2; ++i) | |||
1180 | window[i] = (float) sin(0.5 * M_PI3.14159265358979323846 * square((float) sin((i - 0 + 0.5) / n2 * 0.5 * M_PI3.14159265358979323846))); | |||
1181 | } | |||
1182 | ||||
1183 | static void compute_bitreverse(int n, uint16 *rev) | |||
1184 | { | |||
1185 | int ld = ilog(n) - 1; // ilog is off-by-one from normal definitions | |||
1186 | int i, n8 = n >> 3; | |||
1187 | for (i=0; i < n8; ++i) | |||
1188 | rev[i] = (bit_reverse(i) >> (32-ld+3)) << 2; | |||
1189 | } | |||
1190 | ||||
1191 | static int init_blocksize(vorb *f, int b, int n) | |||
1192 | { | |||
1193 | int n2 = n >> 1, n4 = n >> 2, n8 = n >> 3; | |||
1194 | f->A[b] = (float *) setup_malloc(f, sizeof(float) * n2); | |||
1195 | f->B[b] = (float *) setup_malloc(f, sizeof(float) * n2); | |||
1196 | f->C(2 | 4 | 1)[b] = (float *) setup_malloc(f, sizeof(float) * n4); | |||
1197 | if (!f->A[b] || !f->B[b] || !f->C(2 | 4 | 1)[b]) return error(f, VORBIS_outofmem); | |||
1198 | compute_twiddle_factors(n, f->A[b], f->B[b], f->C(2 | 4 | 1)[b]); | |||
1199 | f->window[b] = (float *) setup_malloc(f, sizeof(float) * n2); | |||
1200 | if (!f->window[b]) return error(f, VORBIS_outofmem); | |||
1201 | compute_window(n, f->window[b]); | |||
1202 | f->bit_reverse[b] = (uint16 *) setup_malloc(f, sizeof(uint16) * n8); | |||
1203 | if (!f->bit_reverse[b]) return error(f, VORBIS_outofmem); | |||
1204 | compute_bitreverse(n, f->bit_reverse[b]); | |||
1205 | return TRUE1; | |||
1206 | } | |||
1207 | ||||
1208 | static void neighbors(uint16 *x, int n, int *plow, int *phigh) | |||
1209 | { | |||
1210 | int low = -1; | |||
1211 | int high = 65536; | |||
1212 | int i; | |||
1213 | for (i=0; i < n; ++i) { | |||
1214 | if (x[i] > low && x[i] < x[n]) { *plow = i; low = x[i]; } | |||
1215 | if (x[i] < high && x[i] > x[n]) { *phigh = i; high = x[i]; } | |||
1216 | } | |||
1217 | } | |||
1218 | ||||
1219 | // this has been repurposed so y is now the original index instead of y | |||
1220 | typedef struct | |||
1221 | { | |||
1222 | uint16 x,y; | |||
1223 | } Point; | |||
1224 | ||||
1225 | int point_compare(const void *p, const void *q) | |||
1226 | { | |||
1227 | Point *a = (Point *) p; | |||
1228 | Point *b = (Point *) q; | |||
1229 | return a->x < b->x ? -1 : a->x > b->x; | |||
1230 | } | |||
1231 | ||||
1232 | // | |||
1233 | /////////////////////// END LEAF SETUP FUNCTIONS ////////////////////////// | |||
1234 | ||||
1235 | ||||
1236 | #if defined(STB_VORBIS_NO_STDIO) | |||
1237 | #define USE_MEMORY(z)((z)->stream) TRUE1 | |||
1238 | #else | |||
1239 | #define USE_MEMORY(z)((z)->stream) ((z)->stream) | |||
1240 | #endif | |||
1241 | ||||
1242 | static uint8 get8(vorb *z) | |||
1243 | { | |||
1244 | if (USE_MEMORY(z)((z)->stream)) { | |||
1245 | if (z->stream >= z->stream_end) { z->eof = TRUE1; return 0; } | |||
1246 | return *z->stream++; | |||
1247 | } | |||
1248 | ||||
1249 | #ifndef STB_VORBIS_NO_STDIO | |||
1250 | { | |||
1251 | int c = fgetc(z->f); | |||
1252 | if (c == EOF(-1)) { z->eof = TRUE1; return 0; } | |||
1253 | return c; | |||
1254 | } | |||
1255 | #endif | |||
1256 | } | |||
1257 | ||||
1258 | static uint32 get32(vorb *f) | |||
1259 | { | |||
1260 | uint32 x; | |||
1261 | x = get8(f); | |||
1262 | x += get8(f) << 8; | |||
1263 | x += get8(f) << 16; | |||
1264 | x += get8(f) << 24; | |||
1265 | return x; | |||
1266 | } | |||
1267 | ||||
1268 | static int getn(vorb *z, uint8 *data, int n) | |||
1269 | { | |||
1270 | if (USE_MEMORY(z)((z)->stream)) { | |||
1271 | if (z->stream+n > z->stream_end) { z->eof = 1; return 0; } | |||
1272 | memcpy(data, z->stream, n); | |||
1273 | z->stream += n; | |||
1274 | return 1; | |||
1275 | } | |||
1276 | ||||
1277 | #ifndef STB_VORBIS_NO_STDIO | |||
1278 | if (fread(data, n, 1, z->f) == 1) | |||
1279 | return 1; | |||
1280 | else { | |||
1281 | z->eof = 1; | |||
1282 | return 0; | |||
1283 | } | |||
1284 | #endif | |||
1285 | } | |||
1286 | ||||
1287 | static void skip(vorb *z, int n) | |||
1288 | { | |||
1289 | if (USE_MEMORY(z)((z)->stream)) { | |||
1290 | z->stream += n; | |||
1291 | if (z->stream >= z->stream_end) z->eof = 1; | |||
1292 | return; | |||
1293 | } | |||
1294 | #ifndef STB_VORBIS_NO_STDIO | |||
1295 | { | |||
1296 | long x = ftell(z->f); | |||
1297 | fseek(z->f, x+n, SEEK_SET0); | |||
1298 | } | |||
1299 | #endif | |||
1300 | } | |||
1301 | ||||
1302 | static int set_file_offset(stb_vorbis *f, unsigned int loc) | |||
1303 | { | |||
1304 | #ifndef STB_VORBIS_NO_PUSHDATA_API | |||
1305 | if (f->push_mode) return 0; | |||
1306 | #endif | |||
1307 | f->eof = 0; | |||
1308 | if (USE_MEMORY(f)((f)->stream)) { | |||
1309 | if (f->stream_start + loc >= f->stream_end || f->stream_start + loc < f->stream_start) { | |||
1310 | f->stream = f->stream_end; | |||
1311 | f->eof = 1; | |||
1312 | return 0; | |||
1313 | } else { | |||
1314 | f->stream = f->stream_start + loc; | |||
1315 | return 1; | |||
1316 | } | |||
1317 | } | |||
1318 | #ifndef STB_VORBIS_NO_STDIO | |||
1319 | if (loc + f->f_start < loc || loc >= 0x80000000) { | |||
1320 | loc = 0x7fffffff; | |||
1321 | f->eof = 1; | |||
1322 | } else { | |||
1323 | loc += f->f_start; | |||
1324 | } | |||
1325 | if (!fseek(f->f, loc, SEEK_SET0)) | |||
1326 | return 1; | |||
1327 | f->eof = 1; | |||
1328 | fseek(f->f, f->f_start, SEEK_END2); | |||
1329 | return 0; | |||
1330 | #endif | |||
1331 | } | |||
1332 | ||||
1333 | ||||
1334 | static uint8 ogg_page_header[4] = { 0x4f, 0x67, 0x67, 0x53 }; | |||
1335 | ||||
1336 | static int capture_pattern(vorb *f) | |||
1337 | { | |||
1338 | if (0x4f != get8(f)) return FALSE0; | |||
1339 | if (0x67 != get8(f)) return FALSE0; | |||
1340 | if (0x67 != get8(f)) return FALSE0; | |||
1341 | if (0x53 != get8(f)) return FALSE0; | |||
1342 | return TRUE1; | |||
1343 | } | |||
1344 | ||||
1345 | #define PAGEFLAG_continued_packet1 1 | |||
1346 | #define PAGEFLAG_first_page2 2 | |||
1347 | #define PAGEFLAG_last_page4 4 | |||
1348 | ||||
1349 | static int start_page_no_capturepattern(vorb *f) | |||
1350 | { | |||
1351 | uint32 loc0,loc1,n; | |||
1352 | int32 i; | |||
1353 | // stream structure version | |||
1354 | if (0 != get8(f)) return error(f, VORBIS_invalid_stream_structure_version); | |||
1355 | // header flag | |||
1356 | f->page_flag = get8(f); | |||
1357 | // absolute granule position | |||
1358 | loc0 = get32(f); | |||
1359 | loc1 = get32(f); | |||
1360 | // @TODO: validate loc0,loc1 as valid positions? | |||
1361 | // stream serial number -- vorbis doesn't interleave, so discard | |||
1362 | get32(f); | |||
1363 | //if (f->serial != get32(f)) return error(f, VORBIS_incorrect_stream_serial_number); | |||
1364 | // page sequence number | |||
1365 | n = get32(f); | |||
1366 | f->last_page = n; | |||
1367 | // CRC32 | |||
1368 | get32(f); | |||
1369 | // page_segments | |||
1370 | f->segment_count = get8(f); | |||
1371 | if (!getn(f, f->segments, f->segment_count)) | |||
1372 | return error(f, VORBIS_unexpected_eof); | |||
1373 | // assume we _don't_ know any the sample position of any segments | |||
1374 | f->end_seg_with_known_loc = -2; | |||
1375 | if (loc0 != ~0 || loc1 != ~0) { | |||
1376 | // determine which packet is the last one that will complete | |||
1377 | for (i=f->segment_count-1; i >= 0; --i) | |||
1378 | if (f->segments[i] < 255) | |||
1379 | break; | |||
1380 | // 'i' is now the index of the _last_ segment of a packet that ends | |||
1381 | if (i >= 0) { | |||
1382 | f->end_seg_with_known_loc = i; | |||
1383 | f->known_loc_for_packet = loc0; | |||
1384 | } | |||
1385 | } | |||
1386 | if (f->first_decode) { | |||
1387 | int i,len; | |||
1388 | ProbedPage p; | |||
1389 | len = 0; | |||
1390 | for (i=0; i < f->segment_count; ++i) | |||
1391 | len += f->segments[i]; | |||
1392 | len += 27 + f->segment_count; | |||
1393 | p.page_start = f->first_audio_page_offset; | |||
1394 | p.page_end = p.page_start + len; | |||
1395 | p.after_previous_page_start = p.page_start; | |||
1396 | p.first_decoded_sample = 0; | |||
1397 | p.last_decoded_sample = loc0; | |||
1398 | f->p_first = p; | |||
1399 | } | |||
1400 | f->next_seg = 0; | |||
1401 | return TRUE1; | |||
1402 | } | |||
1403 | ||||
1404 | static int start_page(vorb *f) | |||
1405 | { | |||
1406 | if (!capture_pattern(f)) return error(f, VORBIS_missing_capture_pattern); | |||
1407 | return start_page_no_capturepattern(f); | |||
1408 | } | |||
1409 | ||||
1410 | static int start_packet(vorb *f) | |||
1411 | { | |||
1412 | while (f->next_seg == -1) { | |||
1413 | if (!start_page(f)) return FALSE0; | |||
1414 | if (f->page_flag & PAGEFLAG_continued_packet1) | |||
1415 | return error(f, VORBIS_continued_packet_flag_invalid); | |||
1416 | } | |||
1417 | f->last_seg = FALSE0; | |||
1418 | f->valid_bits = 0; | |||
1419 | f->packet_bytes = 0; | |||
1420 | f->bytes_in_seg = 0; | |||
1421 | // f->next_seg is now valid | |||
1422 | return TRUE1; | |||
1423 | } | |||
1424 | ||||
1425 | static int maybe_start_packet(vorb *f) | |||
1426 | { | |||
1427 | if (f->next_seg == -1) { | |||
1428 | int x = get8(f); | |||
1429 | if (f->eof) return FALSE0; // EOF at page boundary is not an error! | |||
1430 | if (0x4f != x ) return error(f, VORBIS_missing_capture_pattern); | |||
1431 | if (0x67 != get8(f)) return error(f, VORBIS_missing_capture_pattern); | |||
1432 | if (0x67 != get8(f)) return error(f, VORBIS_missing_capture_pattern); | |||
1433 | if (0x53 != get8(f)) return error(f, VORBIS_missing_capture_pattern); | |||
1434 | if (!start_page_no_capturepattern(f)) return FALSE0; | |||
1435 | if (f->page_flag & PAGEFLAG_continued_packet1) { | |||
1436 | // set up enough state that we can read this packet if we want, | |||
1437 | // e.g. during recovery | |||
1438 | f->last_seg = FALSE0; | |||
1439 | f->bytes_in_seg = 0; | |||
1440 | return error(f, VORBIS_continued_packet_flag_invalid); | |||
1441 | } | |||
1442 | } | |||
1443 | return start_packet(f); | |||
1444 | } | |||
1445 | ||||
1446 | static int next_segment(vorb *f) | |||
1447 | { | |||
1448 | int len; | |||
1449 | if (f->last_seg) return 0; | |||
1450 | if (f->next_seg == -1) { | |||
1451 | f->last_seg_which = f->segment_count-1; // in case start_page fails | |||
1452 | if (!start_page(f)) { f->last_seg = 1; return 0; } | |||
1453 | if (!(f->page_flag & PAGEFLAG_continued_packet1)) return error(f, VORBIS_continued_packet_flag_invalid); | |||
1454 | } | |||
1455 | len = f->segments[f->next_seg++]; | |||
1456 | if (len < 255) { | |||
1457 | f->last_seg = TRUE1; | |||
1458 | f->last_seg_which = f->next_seg-1; | |||
1459 | } | |||
1460 | if (f->next_seg >= f->segment_count) | |||
1461 | f->next_seg = -1; | |||
1462 | assert(f->bytes_in_seg == 0)((f->bytes_in_seg == 0) ? (void)0 : _assert("f->bytes_in_seg == 0" , "src/siege/internal/stb/stb_vorbis.c", 1462)); | |||
1463 | f->bytes_in_seg = len; | |||
1464 | return len; | |||
1465 | } | |||
1466 | ||||
1467 | #define EOP(-1) (-1) | |||
1468 | #define INVALID_BITS(-1) (-1) | |||
1469 | ||||
1470 | static int get8_packet_raw(vorb *f) | |||
1471 | { | |||
1472 | if (!f->bytes_in_seg) | |||
1473 | { | |||
1474 | if (f->last_seg) return EOP(-1); | |||
1475 | else if (!next_segment(f)) return EOP(-1); | |||
1476 | } | |||
1477 | assert(f->bytes_in_seg > 0)((f->bytes_in_seg > 0) ? (void)0 : _assert("f->bytes_in_seg > 0" , "src/siege/internal/stb/stb_vorbis.c", 1477)); | |||
1478 | --f->bytes_in_seg; | |||
1479 | ++f->packet_bytes; | |||
1480 | return get8(f); | |||
1481 | } | |||
1482 | ||||
1483 | static int get8_packet(vorb *f) | |||
1484 | { | |||
1485 | int x = get8_packet_raw(f); | |||
1486 | f->valid_bits = 0; | |||
1487 | return x; | |||
1488 | } | |||
1489 | ||||
1490 | static void flush_packet(vorb *f) | |||
1491 | { | |||
1492 | while (get8_packet_raw(f) != EOP(-1)); | |||
1493 | } | |||
1494 | ||||
1495 | // @OPTIMIZE: this is the secondary bit decoder, so it's probably not as important | |||
1496 | // as the huffman decoder? | |||
1497 | static uint32 get_bits(vorb *f, int n) | |||
1498 | { | |||
1499 | uint32 z; | |||
1500 | ||||
1501 | if (f->valid_bits < 0) return 0; | |||
1502 | if (f->valid_bits < n) { | |||
1503 | if (n > 24) { | |||
1504 | // the accumulator technique below would not work correctly in this case | |||
1505 | z = get_bits(f, 24); | |||
1506 | z += get_bits(f, n-24) << 24; | |||
1507 | return z; | |||
1508 | } | |||
1509 | if (f->valid_bits == 0) f->acc = 0; | |||
1510 | while (f->valid_bits < n) { | |||
1511 | int z = get8_packet_raw(f); | |||
1512 | if (z == EOP(-1)) { | |||
1513 | f->valid_bits = INVALID_BITS(-1); | |||
1514 | return 0; | |||
1515 | } | |||
1516 | f->acc += z << f->valid_bits; | |||
1517 | f->valid_bits += 8; | |||
1518 | } | |||
1519 | } | |||
1520 | if (f->valid_bits < 0) return 0; | |||
1521 | z = f->acc & ((1 << n)-1); | |||
1522 | f->acc >>= n; | |||
1523 | f->valid_bits -= n; | |||
1524 | return z; | |||
1525 | } | |||
1526 | ||||
1527 | static int32 get_bits_signed(vorb *f, int n) | |||
1528 | { | |||
1529 | uint32 z = get_bits(f, n); | |||
1530 | if (z & (1 << (n-1))) | |||
1531 | z += ~((1 << n) - 1); | |||
1532 | return (int32) z; | |||
1533 | } | |||
1534 | ||||
1535 | // @OPTIMIZE: primary accumulator for huffman | |||
1536 | // expand the buffer to as many bits as possible without reading off end of packet | |||
1537 | // it might be nice to allow f->valid_bits and f->acc to be stored in registers, | |||
1538 | // e.g. cache them locally and decode locally | |||
1539 | static __forceinlineinline void prep_huffman(vorb *f) | |||
1540 | { | |||
1541 | if (f->valid_bits <= 24) { | |||
1542 | if (f->valid_bits == 0) f->acc = 0; | |||
1543 | do { | |||
1544 | int z; | |||
1545 | if (f->last_seg && !f->bytes_in_seg) return; | |||
1546 | z = get8_packet_raw(f); | |||
1547 | if (z == EOP(-1)) return; | |||
1548 | f->acc += z << f->valid_bits; | |||
1549 | f->valid_bits += 8; | |||
1550 | } while (f->valid_bits <= 24); | |||
1551 | } | |||
1552 | } | |||
1553 | ||||
1554 | enum | |||
1555 | { | |||
1556 | VORBIS_packet_id = 1, | |||
1557 | VORBIS_packet_comment = 3, | |||
1558 | VORBIS_packet_setup = 5, | |||
1559 | }; | |||
1560 | ||||
1561 | static int codebook_decode_scalar_raw(vorb *f, Codebook *c) | |||
1562 | { | |||
1563 | int i; | |||
1564 | prep_huffman(f); | |||
1565 | ||||
1566 | assert(c->sorted_codewords || c->codewords)((c->sorted_codewords || c->codewords) ? (void)0 : _assert ("c->sorted_codewords || c->codewords", "src/siege/internal/stb/stb_vorbis.c" , 1566)); | |||
1567 | // cases to use binary search: sorted_codewords && !c->codewords | |||
1568 | // sorted_codewords && c->entries > 8 | |||
1569 | if (c->entries > 8 ? c->sorted_codewords!=NULL((void*)0) : !c->codewords) { | |||
1570 | // binary search | |||
1571 | uint32 code = bit_reverse(f->acc); | |||
1572 | int x=0, n=c->sorted_entries, len; | |||
1573 | ||||
1574 | while (n > 1) { | |||
1575 | // invariant: sc[x] <= code < sc[x+n] | |||
1576 | int m = x + (n >> 1); | |||
1577 | if (c->sorted_codewords[m] <= code) { | |||
1578 | x = m; | |||
1579 | n -= (n>>1); | |||
1580 | } else { | |||
1581 | n >>= 1; | |||
1582 | } | |||
1583 | } | |||
1584 | // x is now the sorted index | |||
1585 | if (!c->sparse) x = c->sorted_values[x]; | |||
1586 | // x is now sorted index if sparse, or symbol otherwise | |||
1587 | len = c->codeword_lengths[x]; | |||
1588 | if (f->valid_bits >= len) { | |||
1589 | f->acc >>= len; | |||
1590 | f->valid_bits -= len; | |||
1591 | return x; | |||
1592 | } | |||
1593 | ||||
1594 | f->valid_bits = 0; | |||
1595 | return -1; | |||
1596 | } | |||
1597 | ||||
1598 | // if small, linear search | |||
1599 | assert(!c->sparse)((!c->sparse) ? (void)0 : _assert("!c->sparse", "src/siege/internal/stb/stb_vorbis.c" , 1599)); | |||
1600 | for (i=0; i < c->entries; ++i) { | |||
1601 | if (c->codeword_lengths[i] == NO_CODE255) continue; | |||
1602 | if (c->codewords[i] == (f->acc & ((1 << c->codeword_lengths[i])-1))) { | |||
1603 | if (f->valid_bits >= c->codeword_lengths[i]) { | |||
1604 | f->acc >>= c->codeword_lengths[i]; | |||
1605 | f->valid_bits -= c->codeword_lengths[i]; | |||
1606 | return i; | |||
1607 | } | |||
1608 | f->valid_bits = 0; | |||
1609 | return -1; | |||
1610 | } | |||
1611 | } | |||
1612 | ||||
1613 | error(f, VORBIS_invalid_stream); | |||
1614 | f->valid_bits = 0; | |||
1615 | return -1; | |||
1616 | } | |||
1617 | ||||
1618 | static int codebook_decode_scalar(vorb *f, Codebook *c) | |||
1619 | { | |||
1620 | int i; | |||
1621 | if (f->valid_bits < STB_VORBIS_FAST_HUFFMAN_LENGTH10) | |||
1622 | prep_huffman(f); | |||
1623 | // fast huffman table lookup | |||
1624 | i = f->acc & FAST_HUFFMAN_TABLE_MASK((1 << 10) - 1); | |||
1625 | i = c->fast_huffman[i]; | |||
1626 | if (i >= 0) { | |||
1627 | f->acc >>= c->codeword_lengths[i]; | |||
1628 | f->valid_bits -= c->codeword_lengths[i]; | |||
1629 | if (f->valid_bits < 0) { f->valid_bits = 0; return -1; } | |||
1630 | return i; | |||
1631 | } | |||
1632 | return codebook_decode_scalar_raw(f,c); | |||
1633 | } | |||
1634 | ||||
1635 | #ifndef STB_VORBIS_NO_INLINE_DECODE | |||
1636 | ||||
1637 | #define DECODE_RAW(var, f,c)if (f->valid_bits < 10) prep_huffman(f); var = f->acc & ((1 << 10) - 1); var = c->fast_huffman[var]; if (var >= 0) { int n = c->codeword_lengths[var]; f->acc >>= n; f->valid_bits -= n; if (f->valid_bits < 0) { f->valid_bits = 0; var = -1; } } else { var = codebook_decode_scalar_raw (f,c); } \ | |||
1638 | if (f->valid_bits < STB_VORBIS_FAST_HUFFMAN_LENGTH10) \ | |||
1639 | prep_huffman(f); \ | |||
1640 | var = f->acc & FAST_HUFFMAN_TABLE_MASK((1 << 10) - 1); \ | |||
1641 | var = c->fast_huffman[var]; \ | |||
1642 | if (var >= 0) { \ | |||
1643 | int n = c->codeword_lengths[var]; \ | |||
1644 | f->acc >>= n; \ | |||
1645 | f->valid_bits -= n; \ | |||
1646 | if (f->valid_bits < 0) { f->valid_bits = 0; var = -1; } \ | |||
1647 | } else { \ | |||
1648 | var = codebook_decode_scalar_raw(f,c); \ | |||
1649 | } | |||
1650 | ||||
1651 | #else | |||
1652 | ||||
1653 | #define DECODE_RAW(var,f,c)if (f->valid_bits < 10) prep_huffman(f); var = f->acc & ((1 << 10) - 1); var = c->fast_huffman[var]; if (var >= 0) { int n = c->codeword_lengths[var]; f->acc >>= n; f->valid_bits -= n; if (f->valid_bits < 0) { f->valid_bits = 0; var = -1; } } else { var = codebook_decode_scalar_raw (f,c); } var = codebook_decode_scalar(f,c); | |||
1654 | ||||
1655 | #endif | |||
1656 | ||||
1657 | #define DECODE(var,f,c)if (f->valid_bits < 10) prep_huffman(f); var = f->acc & ((1 << 10) - 1); var = c->fast_huffman[var]; if (var >= 0) { int n = c->codeword_lengths[var]; f->acc >>= n; f->valid_bits -= n; if (f->valid_bits < 0) { f->valid_bits = 0; var = -1; } } else { var = codebook_decode_scalar_raw (f,c); } if (c->sparse) var = c->sorted_values[var]; \ | |||
1658 | DECODE_RAW(var,f,c)if (f->valid_bits < 10) prep_huffman(f); var = f->acc & ((1 << 10) - 1); var = c->fast_huffman[var]; if (var >= 0) { int n = c->codeword_lengths[var]; f->acc >>= n; f->valid_bits -= n; if (f->valid_bits < 0) { f->valid_bits = 0; var = -1; } } else { var = codebook_decode_scalar_raw (f,c); } \ | |||
1659 | if (c->sparse) var = c->sorted_values[var]; | |||
1660 | ||||
1661 | #ifndef STB_VORBIS_DIVIDES_IN_CODEBOOK | |||
1662 | #define DECODE_VQ(var,f,c)if (f->valid_bits < 10) prep_huffman(f); var = f->acc & ((1 << 10) - 1); var = c->fast_huffman[var]; if (var >= 0) { int n = c->codeword_lengths[var]; f->acc >>= n; f->valid_bits -= n; if (f->valid_bits < 0) { f->valid_bits = 0; var = -1; } } else { var = codebook_decode_scalar_raw (f,c); } DECODE_RAW(var,f,c)if (f->valid_bits < 10) prep_huffman(f); var = f->acc & ((1 << 10) - 1); var = c->fast_huffman[var]; if (var >= 0) { int n = c->codeword_lengths[var]; f->acc >>= n; f->valid_bits -= n; if (f->valid_bits < 0) { f->valid_bits = 0; var = -1; } } else { var = codebook_decode_scalar_raw (f,c); } | |||
1663 | #else | |||
1664 | #define DECODE_VQ(var,f,c)if (f->valid_bits < 10) prep_huffman(f); var = f->acc & ((1 << 10) - 1); var = c->fast_huffman[var]; if (var >= 0) { int n = c->codeword_lengths[var]; f->acc >>= n; f->valid_bits -= n; if (f->valid_bits < 0) { f->valid_bits = 0; var = -1; } } else { var = codebook_decode_scalar_raw (f,c); } DECODE(var,f,c)if (f->valid_bits < 10) prep_huffman(f); var = f->acc & ((1 << 10) - 1); var = c->fast_huffman[var]; if (var >= 0) { int n = c->codeword_lengths[var]; f->acc >>= n; f->valid_bits -= n; if (f->valid_bits < 0) { f->valid_bits = 0; var = -1; } } else { var = codebook_decode_scalar_raw (f,c); } if (c->sparse) var = c->sorted_values[var]; | |||
1665 | #endif | |||
1666 | ||||
1667 | ||||
1668 | ||||
1669 | ||||
1670 | ||||
1671 | ||||
1672 | // CODEBOOK_ELEMENT_FAST is an optimization for the CODEBOOK_FLOATS case | |||
1673 | // where we avoid one addition | |||
1674 | #ifndef STB_VORBIS_CODEBOOK_FLOATS | |||
1675 | #define CODEBOOK_ELEMENT(c,off)(c->multiplicands[off]) (c->multiplicands[off] * c->delta_value + c->minimum_value) | |||
1676 | #define CODEBOOK_ELEMENT_FAST(c,off)(c->multiplicands[off]) (c->multiplicands[off] * c->delta_value) | |||
1677 | #define CODEBOOK_ELEMENT_BASE(c)(0) (c->minimum_value) | |||
1678 | #else | |||
1679 | #define CODEBOOK_ELEMENT(c,off)(c->multiplicands[off]) (c->multiplicands[off]) | |||
1680 | #define CODEBOOK_ELEMENT_FAST(c,off)(c->multiplicands[off]) (c->multiplicands[off]) | |||
1681 | #define CODEBOOK_ELEMENT_BASE(c)(0) (0) | |||
1682 | #endif | |||
1683 | ||||
1684 | static int codebook_decode_start(vorb *f, Codebook *c, int len) | |||
1685 | { | |||
1686 | int z = -1; | |||
1687 | ||||
1688 | // type 0 is only legal in a scalar context | |||
1689 | if (c->lookup_type == 0) | |||
1690 | error(f, VORBIS_invalid_stream); | |||
1691 | else { | |||
1692 | DECODE_VQ(z,f,c)if (f->valid_bits < 10) prep_huffman(f); z = f->acc & ((1 << 10) - 1); z = c->fast_huffman[z]; if (z >= 0) { int n = c->codeword_lengths[z]; f->acc >>= n ; f->valid_bits -= n; if (f->valid_bits < 0) { f-> valid_bits = 0; z = -1; } } else { z = codebook_decode_scalar_raw (f,c); }; | |||
1693 | if (c->sparse) assert(z < c->sorted_entries)((z < c->sorted_entries) ? (void)0 : _assert("z < c->sorted_entries" , "src/siege/internal/stb/stb_vorbis.c", 1693)); | |||
1694 | if (z < 0) { // check for EOP | |||
1695 | if (!f->bytes_in_seg) | |||
1696 | if (f->last_seg) | |||
1697 | return z; | |||
1698 | error(f, VORBIS_invalid_stream); | |||
1699 | } | |||
1700 | } | |||
1701 | return z; | |||
1702 | } | |||
1703 | ||||
1704 | static int codebook_decode(vorb *f, Codebook *c, float *output, int len) | |||
1705 | { | |||
1706 | int i,z = codebook_decode_start(f,c,len); | |||
1707 | if (z < 0) return FALSE0; | |||
1708 | if (len > c->dimensions) len = c->dimensions; | |||
1709 | ||||
1710 | #ifdef STB_VORBIS_DIVIDES_IN_CODEBOOK | |||
1711 | if (c->lookup_type == 1) { | |||
1712 | float last = CODEBOOK_ELEMENT_BASE(c)(0); | |||
1713 | int div = 1; | |||
1714 | for (i=0; i < len; ++i) { | |||
1715 | int off = (z / div) % c->lookup_values; | |||
1716 | float val = CODEBOOK_ELEMENT_FAST(c,off)(c->multiplicands[off]) + last; | |||
1717 | output[i] += val; | |||
1718 | if (c->sequence_p) last = val + c->minimum_value; | |||
1719 | div *= c->lookup_values; | |||
1720 | } | |||
1721 | return TRUE1; | |||
1722 | } | |||
1723 | #endif | |||
1724 | ||||
1725 | z *= c->dimensions; | |||
1726 | if (c->sequence_p) { | |||
1727 | float last = CODEBOOK_ELEMENT_BASE(c)(0); | |||
1728 | for (i=0; i < len; ++i) { | |||
1729 | float val = CODEBOOK_ELEMENT_FAST(c,z+i)(c->multiplicands[z+i]) + last; | |||
1730 | output[i] += val; | |||
1731 | last = val + c->minimum_value; | |||
1732 | } | |||
1733 | } else { | |||
1734 | float last = CODEBOOK_ELEMENT_BASE(c)(0); | |||
1735 | for (i=0; i < len; ++i) { | |||
1736 | output[i] += CODEBOOK_ELEMENT_FAST(c,z+i)(c->multiplicands[z+i]) + last; | |||
1737 | } | |||
1738 | } | |||
1739 | ||||
1740 | return TRUE1; | |||
1741 | } | |||
1742 | ||||
1743 | static int codebook_decode_step(vorb *f, Codebook *c, float *output, int len, int step) | |||
1744 | { | |||
1745 | int i,z = codebook_decode_start(f,c,len); | |||
1746 | float last = CODEBOOK_ELEMENT_BASE(c)(0); | |||
1747 | if (z < 0) return FALSE0; | |||
1748 | if (len > c->dimensions) len = c->dimensions; | |||
1749 | ||||
1750 | #ifdef STB_VORBIS_DIVIDES_IN_CODEBOOK | |||
1751 | if (c->lookup_type == 1) { | |||
1752 | int div = 1; | |||
1753 | for (i=0; i < len; ++i) { | |||
1754 | int off = (z / div) % c->lookup_values; | |||
1755 | float val = CODEBOOK_ELEMENT_FAST(c,off)(c->multiplicands[off]) + last; | |||
1756 | output[i*step] += val; | |||
1757 | if (c->sequence_p) last = val; | |||
1758 | div *= c->lookup_values; | |||
1759 | } | |||
1760 | return TRUE1; | |||
1761 | } | |||
1762 | #endif | |||
1763 | ||||
1764 | z *= c->dimensions; | |||
1765 | for (i=0; i < len; ++i) { | |||
1766 | float val = CODEBOOK_ELEMENT_FAST(c,z+i)(c->multiplicands[z+i]) + last; | |||
1767 | output[i*step] += val; | |||
1768 | if (c->sequence_p) last = val; | |||
1769 | } | |||
1770 | ||||
1771 | return TRUE1; | |||
1772 | } | |||
1773 | ||||
1774 | static int codebook_decode_deinterleave_repeat(vorb *f, Codebook *c, float **outputs, int ch, int *c_inter_p, int *p_inter_p, int len, int total_decode) | |||
1775 | { | |||
1776 | int c_inter = *c_inter_p; | |||
1777 | int p_inter = *p_inter_p; | |||
1778 | int i,z, effective = c->dimensions; | |||
1779 | ||||
1780 | // type 0 is only legal in a scalar context | |||
1781 | if (c->lookup_type == 0) return error(f, VORBIS_invalid_stream); | |||
1782 | ||||
1783 | while (total_decode > 0) { | |||
1784 | float last = CODEBOOK_ELEMENT_BASE(c)(0); | |||
1785 | DECODE_VQ(z,f,c)if (f->valid_bits < 10) prep_huffman(f); z = f->acc & ((1 << 10) - 1); z = c->fast_huffman[z]; if (z >= 0) { int n = c->codeword_lengths[z]; f->acc >>= n ; f->valid_bits -= n; if (f->valid_bits < 0) { f-> valid_bits = 0; z = -1; } } else { z = codebook_decode_scalar_raw (f,c); }; | |||
1786 | #ifndef STB_VORBIS_DIVIDES_IN_CODEBOOK | |||
1787 | assert(!c->sparse || z < c->sorted_entries)((!c->sparse || z < c->sorted_entries) ? (void)0 : _assert ("!c->sparse || z < c->sorted_entries", "src/siege/internal/stb/stb_vorbis.c" , 1787)); | |||
1788 | #endif | |||
1789 | if (z < 0) { | |||
1790 | if (!f->bytes_in_seg) | |||
1791 | if (f->last_seg) return FALSE0; | |||
1792 | return error(f, VORBIS_invalid_stream); | |||
1793 | } | |||
1794 | ||||
1795 | // if this will take us off the end of the buffers, stop short! | |||
1796 | // we check by computing the length of the virtual interleaved | |||
1797 | // buffer (len*ch), our current offset within it (p_inter*ch)+(c_inter), | |||
1798 | // and the length we'll be using (effective) | |||
1799 | if (c_inter + p_inter*ch + effective > len * ch) { | |||
1800 | effective = len*ch - (p_inter*ch - c_inter); | |||
1801 | } | |||
1802 | ||||
1803 | #ifdef STB_VORBIS_DIVIDES_IN_CODEBOOK | |||
1804 | if (c->lookup_type == 1) { | |||
1805 | int div = 1; | |||
1806 | for (i=0; i < effective; ++i) { | |||
1807 | int off = (z / div) % c->lookup_values; | |||
1808 | float val = CODEBOOK_ELEMENT_FAST(c,off)(c->multiplicands[off]) + last; | |||
1809 | outputs[c_inter][p_inter] += val; | |||
1810 | if (++c_inter == ch) { c_inter = 0; ++p_inter; } | |||
1811 | if (c->sequence_p) last = val; | |||
1812 | div *= c->lookup_values; | |||
1813 | } | |||
1814 | } else | |||
1815 | #endif | |||
1816 | { | |||
1817 | z *= c->dimensions; | |||
1818 | if (c->sequence_p) { | |||
1819 | for (i=0; i < effective; ++i) { | |||
1820 | float val = CODEBOOK_ELEMENT_FAST(c,z+i)(c->multiplicands[z+i]) + last; | |||
1821 | outputs[c_inter][p_inter] += val; | |||
1822 | if (++c_inter == ch) { c_inter = 0; ++p_inter; } | |||
1823 | last = val; | |||
1824 | } | |||
1825 | } else { | |||
1826 | for (i=0; i < effective; ++i) { | |||
1827 | float val = CODEBOOK_ELEMENT_FAST(c,z+i)(c->multiplicands[z+i]) + last; | |||
1828 | outputs[c_inter][p_inter] += val; | |||
1829 | if (++c_inter == ch) { c_inter = 0; ++p_inter; } | |||
1830 | } | |||
1831 | } | |||
1832 | } | |||
1833 | ||||
1834 | total_decode -= effective; | |||
1835 | } | |||
1836 | *c_inter_p = c_inter; | |||
1837 | *p_inter_p = p_inter; | |||
1838 | return TRUE1; | |||
1839 | } | |||
1840 | ||||
1841 | #ifndef STB_VORBIS_DIVIDES_IN_CODEBOOK | |||
1842 | static int codebook_decode_deinterleave_repeat_2(vorb *f, Codebook *c, float **outputs, int *c_inter_p, int *p_inter_p, int len, int total_decode) | |||
1843 | { | |||
1844 | int c_inter = *c_inter_p; | |||
1845 | int p_inter = *p_inter_p; | |||
1846 | int i,z, effective = c->dimensions; | |||
1847 | ||||
1848 | // type 0 is only legal in a scalar context | |||
1849 | if (c->lookup_type == 0) return error(f, VORBIS_invalid_stream); | |||
1850 | ||||
1851 | while (total_decode > 0) { | |||
1852 | float last = CODEBOOK_ELEMENT_BASE(c)(0); | |||
1853 | DECODE_VQ(z,f,c)if (f->valid_bits < 10) prep_huffman(f); z = f->acc & ((1 << 10) - 1); z = c->fast_huffman[z]; if (z >= 0) { int n = c->codeword_lengths[z]; f->acc >>= n ; f->valid_bits -= n; if (f->valid_bits < 0) { f-> valid_bits = 0; z = -1; } } else { z = codebook_decode_scalar_raw (f,c); }; | |||
1854 | ||||
1855 | if (z < 0) { | |||
1856 | if (!f->bytes_in_seg) | |||
1857 | if (f->last_seg) return FALSE0; | |||
1858 | return error(f, VORBIS_invalid_stream); | |||
1859 | } | |||
1860 | ||||
1861 | // if this will take us off the end of the buffers, stop short! | |||
1862 | // we check by computing the length of the virtual interleaved | |||
1863 | // buffer (len*ch), our current offset within it (p_inter*ch)+(c_inter), | |||
1864 | // and the length we'll be using (effective) | |||
1865 | if (c_inter + p_inter*2 + effective > len * 2) { | |||
1866 | effective = len*2 - (p_inter*2 - c_inter); | |||
1867 | } | |||
1868 | ||||
1869 | { | |||
1870 | z *= c->dimensions; | |||
1871 | stb_prof(11)(void)0; | |||
1872 | if (c->sequence_p) { | |||
1873 | // haven't optimized this case because I don't have any examples | |||
1874 | for (i=0; i < effective; ++i) { | |||
1875 | float val = CODEBOOK_ELEMENT_FAST(c,z+i)(c->multiplicands[z+i]) + last; | |||
1876 | outputs[c_inter][p_inter] += val; | |||
1877 | if (++c_inter == 2) { c_inter = 0; ++p_inter; } | |||
1878 | last = val; | |||
1879 | } | |||
1880 | } else { | |||
1881 | i=0; | |||
1882 | if (c_inter == 1) { | |||
1883 | float val = CODEBOOK_ELEMENT_FAST(c,z+i)(c->multiplicands[z+i]) + last; | |||
1884 | outputs[c_inter][p_inter] += val; | |||
1885 | c_inter = 0; ++p_inter; | |||
1886 | ++i; | |||
1887 | } | |||
1888 | { | |||
1889 | float *z0 = outputs[0]; | |||
1890 | float *z1 = outputs[1]; | |||
1891 | for (; i+1 < effective;) { | |||
1892 | z0[p_inter] += CODEBOOK_ELEMENT_FAST(c,z+i)(c->multiplicands[z+i]) + last; | |||
1893 | z1[p_inter] += CODEBOOK_ELEMENT_FAST(c,z+i+1)(c->multiplicands[z+i+1]) + last; | |||
1894 | ++p_inter; | |||
1895 | i += 2; | |||
1896 | } | |||
1897 | } | |||
1898 | if (i < effective) { | |||
1899 | float val = CODEBOOK_ELEMENT_FAST(c,z+i)(c->multiplicands[z+i]) + last; | |||
1900 | outputs[c_inter][p_inter] += val; | |||
1901 | if (++c_inter == 2) { c_inter = 0; ++p_inter; } | |||
1902 | } | |||
1903 | } | |||
1904 | } | |||
1905 | ||||
1906 | total_decode -= effective; | |||
1907 | } | |||
1908 | *c_inter_p = c_inter; | |||
1909 | *p_inter_p = p_inter; | |||
1910 | return TRUE1; | |||
1911 | } | |||
1912 | #endif | |||
1913 | ||||
1914 | static int predict_point(int x, int x0, int x1, int y0, int y1) | |||
1915 | { | |||
1916 | int dy = y1 - y0; | |||
1917 | int adx = x1 - x0; | |||
1918 | // @OPTIMIZE: force int division to round in the right direction... is this necessary on x86? | |||
1919 | int err = abs(dy) * (x - x0); | |||
1920 | int off = err / adx; | |||
1921 | return dy < 0 ? y0 - off : y0 + off; | |||
1922 | } | |||
1923 | ||||
1924 | // the following table is block-copied from the specification | |||
1925 | static float inverse_db_table[256] = | |||
1926 | { | |||
1927 | 1.0649863e-07f, 1.1341951e-07f, 1.2079015e-07f, 1.2863978e-07f, | |||
1928 | 1.3699951e-07f, 1.4590251e-07f, 1.5538408e-07f, 1.6548181e-07f, | |||
1929 | 1.7623575e-07f, 1.8768855e-07f, 1.9988561e-07f, 2.1287530e-07f, | |||
1930 | 2.2670913e-07f, 2.4144197e-07f, 2.5713223e-07f, 2.7384213e-07f, | |||
1931 | 2.9163793e-07f, 3.1059021e-07f, 3.3077411e-07f, 3.5226968e-07f, | |||
1932 | 3.7516214e-07f, 3.9954229e-07f, 4.2550680e-07f, 4.5315863e-07f, | |||
1933 | 4.8260743e-07f, 5.1396998e-07f, 5.4737065e-07f, 5.8294187e-07f, | |||
1934 | 6.2082472e-07f, 6.6116941e-07f, 7.0413592e-07f, 7.4989464e-07f, | |||
1935 | 7.9862701e-07f, 8.5052630e-07f, 9.0579828e-07f, 9.6466216e-07f, | |||
1936 | 1.0273513e-06f, 1.0941144e-06f, 1.1652161e-06f, 1.2409384e-06f, | |||
1937 | 1.3215816e-06f, 1.4074654e-06f, 1.4989305e-06f, 1.5963394e-06f, | |||
1938 | 1.7000785e-06f, 1.8105592e-06f, 1.9282195e-06f, 2.0535261e-06f, | |||
1939 | 2.1869758e-06f, 2.3290978e-06f, 2.4804557e-06f, 2.6416497e-06f, | |||
1940 | 2.8133190e-06f, 2.9961443e-06f, 3.1908506e-06f, 3.3982101e-06f, | |||
1941 | 3.6190449e-06f, 3.8542308e-06f, 4.1047004e-06f, 4.3714470e-06f, | |||
1942 | 4.6555282e-06f, 4.9580707e-06f, 5.2802740e-06f, 5.6234160e-06f, | |||
1943 | 5.9888572e-06f, 6.3780469e-06f, 6.7925283e-06f, 7.2339451e-06f, | |||
1944 | 7.7040476e-06f, 8.2047000e-06f, 8.7378876e-06f, 9.3057248e-06f, | |||
1945 | 9.9104632e-06f, 1.0554501e-05f, 1.1240392e-05f, 1.1970856e-05f, | |||
1946 | 1.2748789e-05f, 1.3577278e-05f, 1.4459606e-05f, 1.5399272e-05f, | |||
1947 | 1.6400004e-05f, 1.7465768e-05f, 1.8600792e-05f, 1.9809576e-05f, | |||
1948 | 2.1096914e-05f, 2.2467911e-05f, 2.3928002e-05f, 2.5482978e-05f, | |||
1949 | 2.7139006e-05f, 2.8902651e-05f, 3.0780908e-05f, 3.2781225e-05f, | |||
1950 | 3.4911534e-05f, 3.7180282e-05f, 3.9596466e-05f, 4.2169667e-05f, | |||
1951 | 4.4910090e-05f, 4.7828601e-05f, 5.0936773e-05f, 5.4246931e-05f, | |||
1952 | 5.7772202e-05f, 6.1526565e-05f, 6.5524908e-05f, 6.9783085e-05f, | |||
1953 | 7.4317983e-05f, 7.9147585e-05f, 8.4291040e-05f, 8.9768747e-05f, | |||
1954 | 9.5602426e-05f, 0.00010181521f, 0.00010843174f, 0.00011547824f, | |||
1955 | 0.00012298267f, 0.00013097477f, 0.00013948625f, 0.00014855085f, | |||
1956 | 0.00015820453f, 0.00016848555f, 0.00017943469f, 0.00019109536f, | |||
1957 | 0.00020351382f, 0.00021673929f, 0.00023082423f, 0.00024582449f, | |||
1958 | 0.00026179955f, 0.00027881276f, 0.00029693158f, 0.00031622787f, | |||
1959 | 0.00033677814f, 0.00035866388f, 0.00038197188f, 0.00040679456f, | |||
1960 | 0.00043323036f, 0.00046138411f, 0.00049136745f, 0.00052329927f, | |||
1961 | 0.00055730621f, 0.00059352311f, 0.00063209358f, 0.00067317058f, | |||
1962 | 0.00071691700f, 0.00076350630f, 0.00081312324f, 0.00086596457f, | |||
1963 | 0.00092223983f, 0.00098217216f, 0.0010459992f, 0.0011139742f, | |||
1964 | 0.0011863665f, 0.0012634633f, 0.0013455702f, 0.0014330129f, | |||
1965 | 0.0015261382f, 0.0016253153f, 0.0017309374f, 0.0018434235f, | |||
1966 | 0.0019632195f, 0.0020908006f, 0.0022266726f, 0.0023713743f, | |||
1967 | 0.0025254795f, 0.0026895994f, 0.0028643847f, 0.0030505286f, | |||
1968 | 0.0032487691f, 0.0034598925f, 0.0036847358f, 0.0039241906f, | |||
1969 | 0.0041792066f, 0.0044507950f, 0.0047400328f, 0.0050480668f, | |||
1970 | 0.0053761186f, 0.0057254891f, 0.0060975636f, 0.0064938176f, | |||
1971 | 0.0069158225f, 0.0073652516f, 0.0078438871f, 0.0083536271f, | |||
1972 | 0.0088964928f, 0.009474637f, 0.010090352f, 0.010746080f, | |||
1973 | 0.011444421f, 0.012188144f, 0.012980198f, 0.013823725f, | |||
1974 | 0.014722068f, 0.015678791f, 0.016697687f, 0.017782797f, | |||
1975 | 0.018938423f, 0.020169149f, 0.021479854f, 0.022875735f, | |||
1976 | 0.024362330f, 0.025945531f, 0.027631618f, 0.029427276f, | |||
1977 | 0.031339626f, 0.033376252f, 0.035545228f, 0.037855157f, | |||
1978 | 0.040315199f, 0.042935108f, 0.045725273f, 0.048696758f, | |||
1979 | 0.051861348f, 0.055231591f, 0.058820850f, 0.062643361f, | |||
1980 | 0.066714279f, 0.071049749f, 0.075666962f, 0.080584227f, | |||
1981 | 0.085821044f, 0.091398179f, 0.097337747f, 0.10366330f, | |||
1982 | 0.11039993f, 0.11757434f, 0.12521498f, 0.13335215f, | |||
1983 | 0.14201813f, 0.15124727f, 0.16107617f, 0.17154380f, | |||
1984 | 0.18269168f, 0.19456402f, 0.20720788f, 0.22067342f, | |||
1985 | 0.23501402f, 0.25028656f, 0.26655159f, 0.28387361f, | |||
1986 | 0.30232132f, 0.32196786f, 0.34289114f, 0.36517414f, | |||
1987 | 0.38890521f, 0.41417847f, 0.44109412f, 0.46975890f, | |||
1988 | 0.50028648f, 0.53279791f, 0.56742212f, 0.60429640f, | |||
1989 | 0.64356699f, 0.68538959f, 0.72993007f, 0.77736504f, | |||
1990 | 0.82788260f, 0.88168307f, 0.9389798f, 1.0f | |||
1991 | }; | |||
1992 | ||||
1993 | ||||
1994 | // @OPTIMIZE: if you want to replace this bresenham line-drawing routine, | |||
1995 | // note that you must produce bit-identical output to decode correctly; | |||
1996 | // this specific sequence of operations is specified in the spec (it's | |||
1997 | // drawing integer-quantized frequency-space lines that the encoder | |||
1998 | // expects to be exactly the same) | |||
1999 | // ... also, isn't the whole point of Bresenham's algorithm to NOT | |||
2000 | // have to divide in the setup? sigh. | |||
2001 | #ifndef STB_VORBIS_NO_DEFER_FLOOR | |||
2002 | #define LINE_OP(a,b)a *= b a *= b | |||
2003 | #else | |||
2004 | #define LINE_OP(a,b)a *= b a = b | |||
2005 | #endif | |||
2006 | ||||
2007 | #ifdef STB_VORBIS_DIVIDE_TABLE | |||
2008 | #define DIVTAB_NUMER 32 | |||
2009 | #define DIVTAB_DENOM 64 | |||
2010 | int8 integer_divide_table[DIVTAB_NUMER][DIVTAB_DENOM]; // 2KB | |||
2011 | #endif | |||
2012 | ||||
2013 | static __forceinlineinline void draw_line(float *output, int x0, int y0, int x1, int y1, int n) | |||
2014 | { | |||
2015 | int dy = y1 - y0; | |||
2016 | int adx = x1 - x0; | |||
2017 | int ady = abs(dy); | |||
2018 | int base; | |||
2019 | int x=x0,y=y0; | |||
2020 | int err = 0; | |||
2021 | int sy; | |||
2022 | ||||
2023 | #ifdef STB_VORBIS_DIVIDE_TABLE | |||
2024 | if (adx < DIVTAB_DENOM && ady < DIVTAB_NUMER) { | |||
2025 | if (dy < 0) { | |||
2026 | base = -integer_divide_table[ady][adx]; | |||
2027 | sy = base-1; | |||
2028 | } else { | |||
2029 | base = integer_divide_table[ady][adx]; | |||
2030 | sy = base+1; | |||
2031 | } | |||
2032 | } else { | |||
2033 | base = dy / adx; | |||
2034 | if (dy < 0) | |||
2035 | sy = base - 1; | |||
2036 | else | |||
2037 | sy = base+1; | |||
2038 | } | |||
2039 | #else | |||
2040 | base = dy / adx; | |||
2041 | if (dy < 0) | |||
2042 | sy = base - 1; | |||
2043 | else | |||
2044 | sy = base+1; | |||
2045 | #endif | |||
2046 | ady -= abs(base) * adx; | |||
2047 | if (x1 > n) x1 = n; | |||
2048 | LINE_OP(output[x], inverse_db_table[y])output[x] *= inverse_db_table[y]; | |||
2049 | for (++x; x < x1; ++x) { | |||
2050 | err += ady; | |||
2051 | if (err >= adx) { | |||
2052 | err -= adx; | |||
2053 | y += sy; | |||
2054 | } else | |||
2055 | y += base; | |||
2056 | LINE_OP(output[x], inverse_db_table[y])output[x] *= inverse_db_table[y]; | |||
2057 | } | |||
2058 | } | |||
2059 | ||||
2060 | static int residue_decode(vorb *f, Codebook *book, float *target, int offset, int n, int rtype) | |||
2061 | { | |||
2062 | int k; | |||
2063 | if (rtype == 0) { | |||
2064 | int step = n / book->dimensions; | |||
2065 | for (k=0; k < step; ++k) | |||
2066 | if (!codebook_decode_step(f, book, target+offset+k, n-offset-k, step)) | |||
2067 | return FALSE0; | |||
2068 | } else { | |||
2069 | for (k=0; k < n; ) { | |||
2070 | if (!codebook_decode(f, book, target+offset, n-k)) | |||
2071 | return FALSE0; | |||
2072 | k += book->dimensions; | |||
2073 | offset += book->dimensions; | |||
2074 | } | |||
2075 | } | |||
2076 | return TRUE1; | |||
2077 | } | |||
2078 | ||||
2079 | static void decode_residue(vorb *f, float *residue_buffers[], int ch, int n, int rn, uint8 *do_not_decode) | |||
2080 | { | |||
2081 | int i,j,pass; | |||
2082 | Residue *r = f->residue_config + rn; | |||
2083 | int rtype = f->residue_types[rn]; | |||
2084 | int c = r->classbook; | |||
2085 | int classwords = f->codebooks[c].dimensions; | |||
2086 | int n_read = r->end - r->begin; | |||
2087 | int part_read = n_read / r->part_size; | |||
2088 | int temp_alloc_point = temp_alloc_save(f)((f)->temp_offset); | |||
2089 | #ifndef STB_VORBIS_DIVIDES_IN_RESIDUE | |||
2090 | uint8 ***part_classdata = (uint8 ***) temp_block_array(f,f->channels, part_read * sizeof(**part_classdata))make_block_array((f->alloc.alloc_buffer ? setup_temp_malloc (f,(f->channels*(sizeof(void *)+(part_read * sizeof(**part_classdata ))))) : alloca((f->channels*(sizeof(void *)+(part_read * sizeof (**part_classdata)))))), f->channels, part_read * sizeof(* *part_classdata)); | |||
2091 | #else | |||
2092 | int **classifications = (int **) temp_block_array(f,f->channels, part_read * sizeof(**classifications))make_block_array((f->alloc.alloc_buffer ? setup_temp_malloc (f,(f->channels*(sizeof(void *)+(part_read * sizeof(**classifications ))))) : alloca((f->channels*(sizeof(void *)+(part_read * sizeof (**classifications)))))), f->channels, part_read * sizeof( **classifications)); | |||
2093 | #endif | |||
2094 | ||||
2095 | stb_prof(2)(void)0; | |||
2096 | for (i=0; i < ch; ++i) | |||
2097 | if (!do_not_decode[i]) | |||
2098 | memset(residue_buffers[i], 0, sizeof(float) * n); | |||
2099 | ||||
2100 | if (rtype == 2 && ch != 1) { | |||
2101 | int len = ch * n; | |||
2102 | (void)len; | |||
2103 | for (j=0; j < ch; ++j) | |||
2104 | if (!do_not_decode[j]) | |||
2105 | break; | |||
2106 | if (j == ch) | |||
2107 | goto done; | |||
2108 | ||||
2109 | stb_prof(3)(void)0; | |||
2110 | for (pass=0; pass < 8; ++pass) { | |||
2111 | int pcount = 0, class_set = 0; | |||
2112 | if (ch == 2) { | |||
2113 | stb_prof(13)(void)0; | |||
2114 | while (pcount < part_read) { | |||
2115 | int z = r->begin + pcount*r->part_size; | |||
2116 | int c_inter = (z & 1), p_inter = z>>1; | |||
2117 | if (pass == 0) { | |||
2118 | Codebook *c = f->codebooks+r->classbook; | |||
2119 | int q; | |||
2120 | DECODE(q,f,c)if (f->valid_bits < 10) prep_huffman(f); q = f->acc & ((1 << 10) - 1); q = c->fast_huffman[q]; if (q >= 0) { int n = c->codeword_lengths[q]; f->acc >>= n ; f->valid_bits -= n; if (f->valid_bits < 0) { f-> valid_bits = 0; q = -1; } } else { q = codebook_decode_scalar_raw (f,c); } if (c->sparse) q = c->sorted_values[q];; | |||
2121 | if (q == EOP(-1)) goto done; | |||
2122 | #ifndef STB_VORBIS_DIVIDES_IN_RESIDUE | |||
2123 | part_classdata[0][class_set] = r->classdata[q]; | |||
2124 | #else | |||
2125 | for (i=classwords-1; i >= 0; --i) { | |||
2126 | classifications[0][i+pcount] = q % r->classifications; | |||
2127 | q /= r->classifications; | |||
2128 | } | |||
2129 | #endif | |||
2130 | } | |||
2131 | stb_prof(5)(void)0; | |||
2132 | for (i=0; i < classwords && pcount < part_read; ++i, ++pcount) { | |||
2133 | int z = r->begin + pcount*r->part_size; | |||
2134 | #ifndef STB_VORBIS_DIVIDES_IN_RESIDUE | |||
2135 | int c = part_classdata[0][class_set][i]; | |||
2136 | #else | |||
2137 | int c = classifications[0][pcount]; | |||
2138 | #endif | |||
2139 | int b = r->residue_books[c][pass]; | |||
2140 | if (b >= 0) { | |||
2141 | Codebook *book = f->codebooks + b; | |||
2142 | stb_prof(20)(void)0; // accounts for X time | |||
2143 | #ifdef STB_VORBIS_DIVIDES_IN_CODEBOOK | |||
2144 | if (!codebook_decode_deinterleave_repeat(f, book, residue_buffers, ch, &c_inter, &p_inter, n, r->part_size)) | |||
2145 | goto done; | |||
2146 | #else | |||
2147 | // saves 1% | |||
2148 | if (!codebook_decode_deinterleave_repeat_2(f, book, residue_buffers, &c_inter, &p_inter, n, r->part_size)) | |||
2149 | goto done; | |||
2150 | #endif | |||
2151 | stb_prof(7)(void)0; | |||
2152 | } else { | |||
2153 | z += r->part_size; | |||
2154 | c_inter = z & 1; | |||
2155 | p_inter = z >> 1; | |||
2156 | } | |||
2157 | } | |||
2158 | stb_prof(8)(void)0; | |||
2159 | #ifndef STB_VORBIS_DIVIDES_IN_RESIDUE | |||
2160 | ++class_set; | |||
2161 | #endif | |||
2162 | } | |||
2163 | } else if (ch == 1) { | |||
2164 | while (pcount < part_read) { | |||
2165 | int z = r->begin + pcount*r->part_size; | |||
2166 | int c_inter = 0, p_inter = z; | |||
2167 | if (pass == 0) { | |||
2168 | Codebook *c = f->codebooks+r->classbook; | |||
2169 | int q; | |||
2170 | DECODE(q,f,c)if (f->valid_bits < 10) prep_huffman(f); q = f->acc & ((1 << 10) - 1); q = c->fast_huffman[q]; if (q >= 0) { int n = c->codeword_lengths[q]; f->acc >>= n ; f->valid_bits -= n; if (f->valid_bits < 0) { f-> valid_bits = 0; q = -1; } } else { q = codebook_decode_scalar_raw (f,c); } if (c->sparse) q = c->sorted_values[q];; | |||
2171 | if (q == EOP(-1)) goto done; | |||
2172 | #ifndef STB_VORBIS_DIVIDES_IN_RESIDUE | |||
2173 | part_classdata[0][class_set] = r->classdata[q]; | |||
2174 | #else | |||
2175 | for (i=classwords-1; i >= 0; --i) { | |||
2176 | classifications[0][i+pcount] = q % r->classifications; | |||
2177 | q /= r->classifications; | |||
2178 | } | |||
2179 | #endif | |||
2180 | } | |||
2181 | for (i=0; i < classwords && pcount < part_read; ++i, ++pcount) { | |||
2182 | int z = r->begin + pcount*r->part_size; | |||
2183 | #ifndef STB_VORBIS_DIVIDES_IN_RESIDUE | |||
2184 | int c = part_classdata[0][class_set][i]; | |||
2185 | #else | |||
2186 | int c = classifications[0][pcount]; | |||
2187 | #endif | |||
2188 | int b = r->residue_books[c][pass]; | |||
2189 | if (b >= 0) { | |||
2190 | Codebook *book = f->codebooks + b; | |||
2191 | stb_prof(22)(void)0; | |||
2192 | if (!codebook_decode_deinterleave_repeat(f, book, residue_buffers, ch, &c_inter, &p_inter, n, r->part_size)) | |||
2193 | goto done; | |||
2194 | stb_prof(3)(void)0; | |||
2195 | } else { | |||
2196 | z += r->part_size; | |||
2197 | c_inter = 0; | |||
2198 | p_inter = z; | |||
2199 | } | |||
2200 | } | |||
2201 | #ifndef STB_VORBIS_DIVIDES_IN_RESIDUE | |||
2202 | ++class_set; | |||
2203 | #endif | |||
2204 | } | |||
2205 | } else { | |||
2206 | while (pcount < part_read) { | |||
2207 | int z = r->begin + pcount*r->part_size; | |||
2208 | int c_inter = z % ch, p_inter = z/ch; | |||
2209 | if (pass == 0) { | |||
2210 | Codebook *c = f->codebooks+r->classbook; | |||
2211 | int q; | |||
2212 | DECODE(q,f,c)if (f->valid_bits < 10) prep_huffman(f); q = f->acc & ((1 << 10) - 1); q = c->fast_huffman[q]; if (q >= 0) { int n = c->codeword_lengths[q]; f->acc >>= n ; f->valid_bits -= n; if (f->valid_bits < 0) { f-> valid_bits = 0; q = -1; } } else { q = codebook_decode_scalar_raw (f,c); } if (c->sparse) q = c->sorted_values[q];; | |||
2213 | if (q == EOP(-1)) goto done; | |||
2214 | #ifndef STB_VORBIS_DIVIDES_IN_RESIDUE | |||
2215 | part_classdata[0][class_set] = r->classdata[q]; | |||
2216 | #else | |||
2217 | for (i=classwords-1; i >= 0; --i) { | |||
2218 | classifications[0][i+pcount] = q % r->classifications; | |||
2219 | q /= r->classifications; | |||
2220 | } | |||
2221 | #endif | |||
2222 | } | |||
2223 | for (i=0; i < classwords && pcount < part_read; ++i, ++pcount) { | |||
2224 | int z = r->begin + pcount*r->part_size; | |||
2225 | #ifndef STB_VORBIS_DIVIDES_IN_RESIDUE | |||
2226 | int c = part_classdata[0][class_set][i]; | |||
2227 | #else | |||
2228 | int c = classifications[0][pcount]; | |||
2229 | #endif | |||
2230 | int b = r->residue_books[c][pass]; | |||
2231 | if (b >= 0) { | |||
2232 | Codebook *book = f->codebooks + b; | |||
2233 | stb_prof(22)(void)0; | |||
2234 | if (!codebook_decode_deinterleave_repeat(f, book, residue_buffers, ch, &c_inter, &p_inter, n, r->part_size)) | |||
2235 | goto done; | |||
2236 | stb_prof(3)(void)0; | |||
2237 | } else { | |||
2238 | z += r->part_size; | |||
2239 | c_inter = z % ch; | |||
2240 | p_inter = z / ch; | |||
2241 | } | |||
2242 | } | |||
2243 | #ifndef STB_VORBIS_DIVIDES_IN_RESIDUE | |||
2244 | ++class_set; | |||
2245 | #endif | |||
2246 | } | |||
2247 | } | |||
2248 | } | |||
2249 | goto done; | |||
2250 | } | |||
2251 | stb_prof(9)(void)0; | |||
2252 | ||||
2253 | for (pass=0; pass < 8; ++pass) { | |||
2254 | int pcount = 0, class_set=0; | |||
2255 | while (pcount < part_read) { | |||
2256 | if (pass == 0) { | |||
2257 | for (j=0; j < ch; ++j) { | |||
2258 | if (!do_not_decode[j]) { | |||
2259 | Codebook *c = f->codebooks+r->classbook; | |||
2260 | int temp; | |||
2261 | DECODE(temp,f,c)if (f->valid_bits < 10) prep_huffman(f); temp = f->acc & ((1 << 10) - 1); temp = c->fast_huffman[temp] ; if (temp >= 0) { int n = c->codeword_lengths[temp]; f ->acc >>= n; f->valid_bits -= n; if (f->valid_bits < 0) { f->valid_bits = 0; temp = -1; } } else { temp = codebook_decode_scalar_raw(f,c); } if (c->sparse) temp = c ->sorted_values[temp];; | |||
2262 | if (temp == EOP(-1)) goto done; | |||
2263 | #ifndef STB_VORBIS_DIVIDES_IN_RESIDUE | |||
2264 | part_classdata[j][class_set] = r->classdata[temp]; | |||
2265 | #else | |||
2266 | for (i=classwords-1; i >= 0; --i) { | |||
2267 | classifications[j][i+pcount] = temp % r->classifications; | |||
2268 | temp /= r->classifications; | |||
2269 | } | |||
2270 | #endif | |||
2271 | } | |||
2272 | } | |||
2273 | } | |||
2274 | for (i=0; i < classwords && pcount < part_read; ++i, ++pcount) { | |||
2275 | for (j=0; j < ch; ++j) { | |||
2276 | if (!do_not_decode[j]) { | |||
2277 | #ifndef STB_VORBIS_DIVIDES_IN_RESIDUE | |||
2278 | int c = part_classdata[j][class_set][i]; | |||
2279 | #else | |||
2280 | int c = classifications[j][pcount]; | |||
2281 | #endif | |||
2282 | int b = r->residue_books[c][pass]; | |||
2283 | if (b >= 0) { | |||
2284 | float *target = residue_buffers[j]; | |||
2285 | int offset = r->begin + pcount * r->part_size; | |||
2286 | int n = r->part_size; | |||
2287 | Codebook *book = f->codebooks + b; | |||
2288 | if (!residue_decode(f, book, target, offset, n, rtype)) | |||
2289 | goto done; | |||
2290 | } | |||
2291 | } | |||
2292 | } | |||
2293 | } | |||
2294 | #ifndef STB_VORBIS_DIVIDES_IN_RESIDUE | |||
2295 | ++class_set; | |||
2296 | #endif | |||
2297 | } | |||
2298 | } | |||
2299 | done: | |||
2300 | stb_prof(0)(void)0; | |||
2301 | temp_alloc_restore(f,temp_alloc_point)((f)->temp_offset = (temp_alloc_point)); | |||
2302 | } | |||
2303 | ||||
2304 | ||||
2305 | #if 0 | |||
2306 | // slow way for debugging | |||
2307 | void inverse_mdct_slow(float *buffer, int n) | |||
2308 | { | |||
2309 | int i,j; | |||
2310 | int n2 = n >> 1; | |||
2311 | float *x = (float *) malloc(sizeof(*x) * n2); | |||
2312 | memcpy(x, buffer, sizeof(*x) * n2); | |||
2313 | for (i=0; i < n; ++i) { | |||
2314 | float acc = 0; | |||
2315 | for (j=0; j < n2; ++j) | |||
2316 | // formula from paper: | |||
2317 | //acc += n/4.0f * x[j] * (float) cos(M_PI / 2 / n * (2 * i + 1 + n/2.0)*(2*j+1)); | |||
2318 | // formula from wikipedia | |||
2319 | //acc += 2.0f / n2 * x[j] * (float) cos(M_PI/n2 * (i + 0.5 + n2/2)*(j + 0.5)); | |||
2320 | // these are equivalent, except the formula from the paper inverts the multiplier! | |||
2321 | // however, what actually works is NO MULTIPLIER!?! | |||
2322 | //acc += 64 * 2.0f / n2 * x[j] * (float) cos(M_PI/n2 * (i + 0.5 + n2/2)*(j + 0.5)); | |||
2323 | acc += x[j] * (float) cos(M_PI3.14159265358979323846 / 2 / n * (2 * i + 1 + n/2.0)*(2*j+1)); | |||
2324 | buffer[i] = acc; | |||
2325 | } | |||
2326 | free(x); | |||
2327 | } | |||
2328 | #elif 0 | |||
2329 | // same as above, but just barely able to run in real time on modern machines | |||
2330 | void inverse_mdct_slow(float *buffer, int n, vorb *f, int blocktype) | |||
2331 | { | |||
2332 | float mcos[16384]; | |||
2333 | int i,j; | |||
2334 | int n2 = n >> 1, nmask = (n << 2) -1; | |||
2335 | float *x = (float *) malloc(sizeof(*x) * n2); | |||
2336 | memcpy(x, buffer, sizeof(*x) * n2); | |||
2337 | for (i=0; i < 4*n; ++i) | |||
2338 | mcos[i] = (float) cos(M_PI3.14159265358979323846 / 2 * i / n); | |||
2339 | ||||
2340 | for (i=0; i < n; ++i) { | |||
2341 | float acc = 0; | |||
2342 | for (j=0; j < n2; ++j) | |||
2343 | acc += x[j] * mcos[(2 * i + 1 + n2)*(2*j+1) & nmask]; | |||
2344 | buffer[i] = acc; | |||
2345 | } | |||
2346 | free(x); | |||
2347 | } | |||
2348 | #else | |||
2349 | // transform to use a slow dct-iv; this is STILL basically trivial, | |||
2350 | // but only requires half as many ops | |||
2351 | void dct_iv_slow(float *buffer, int n) | |||
2352 | { | |||
2353 | float mcos[16384]; | |||
2354 | float x[2048]; | |||
2355 | int i,j; | |||
2356 | int n2 = n >> 1, nmask = (n << 3) - 1; | |||
2357 | (void)n2; | |||
2358 | memcpy(x, buffer, sizeof(*x) * n); | |||
2359 | for (i=0; i < 8*n; ++i) | |||
2360 | mcos[i] = (float) cos(M_PI3.14159265358979323846 / 4 * i / n); | |||
2361 | for (i=0; i < n; ++i) { | |||
2362 | float acc = 0; | |||
2363 | for (j=0; j < n; ++j) | |||
2364 | acc += x[j] * mcos[((2 * i + 1)*(2*j+1)) & nmask]; | |||
2365 | //acc += x[j] * cos(M_PI / n * (i + 0.5) * (j + 0.5)); | |||
2366 | buffer[i] = acc; | |||
2367 | } | |||
2368 | } | |||
2369 | ||||
2370 | void inverse_mdct_slow(float *buffer, int n, vorb *f, int blocktype) | |||
2371 | { | |||
2372 | int i, n4 = n >> 2, n2 = n >> 1, n3_4 = n - n4; | |||
2373 | float temp[4096]; | |||
2374 | ||||
2375 | memcpy(temp, buffer, n2 * sizeof(float)); | |||
2376 | dct_iv_slow(temp, n2); // returns -c'-d, a-b' | |||
2377 | ||||
2378 | for (i=0; i < n4 ; ++i) buffer[i] = temp[i+n4]; // a-b' | |||
2379 | for ( ; i < n3_4; ++i) buffer[i] = -temp[n3_4 - i - 1]; // b-a', c+d' | |||
2380 | for ( ; i < n ; ++i) buffer[i] = -temp[i - n3_4]; // c'+d | |||
2381 | } | |||
2382 | #endif | |||
2383 | ||||
2384 | #ifndef LIBVORBIS_MDCT0 | |||
2385 | #define LIBVORBIS_MDCT0 0 | |||
2386 | #endif | |||
2387 | ||||
2388 | #if LIBVORBIS_MDCT0 | |||
2389 | // directly call the vorbis MDCT using an interface documented | |||
2390 | // by Jeff Roberts... useful for performance comparison | |||
2391 | typedef struct | |||
2392 | { | |||
2393 | int n; | |||
2394 | int log2n; | |||
2395 | ||||
2396 | float *trig; | |||
2397 | int *bitrev; | |||
2398 | ||||
2399 | float scale; | |||
2400 | } mdct_lookup; | |||
2401 | ||||
2402 | extern void mdct_init(mdct_lookup *lookup, int n); | |||
2403 | extern void mdct_clear(mdct_lookup *l); | |||
2404 | extern void mdct_backward(mdct_lookup *init, float *in, float *out); | |||
2405 | ||||
2406 | mdct_lookup M1,M2; | |||
2407 | ||||
2408 | void inverse_mdct(float *buffer, int n, vorb *f, int blocktype) | |||
2409 | { | |||
2410 | mdct_lookup *M; | |||
2411 | if (M1.n == n) M = &M1; | |||
2412 | else if (M2.n == n) M = &M2; | |||
2413 | else if (M1.n == 0) { mdct_init(&M1, n); M = &M1; } | |||
2414 | else { | |||
2415 | if (M2.n) __asm int 3; | |||
2416 | mdct_init(&M2, n); | |||
2417 | M = &M2; | |||
2418 | } | |||
2419 | ||||
2420 | mdct_backward(M, buffer, buffer); | |||
2421 | } | |||
2422 | #endif | |||
2423 | ||||
2424 | ||||
2425 | // the following were split out into separate functions while optimizing; | |||
2426 | // they could be pushed back up but eh. __forceinline showed no change; | |||
2427 | // they're probably already being inlined. | |||
2428 | static void imdct_step3_iter0_loop(int n, float *e, int i_off, int k_off, float *A) | |||
2429 | { | |||
2430 | float *ee0 = e + i_off; | |||
2431 | float *ee2 = ee0 + k_off; | |||
2432 | int i; | |||
2433 | ||||
2434 | assert((n & 3) == 0)(((n & 3) == 0) ? (void)0 : _assert("(n & 3) == 0", "src/siege/internal/stb/stb_vorbis.c" , 2434)); | |||
2435 | for (i=(n>>2); i > 0; --i) { | |||
2436 | float k00_20, k01_21; | |||
2437 | k00_20 = ee0[ 0] - ee2[ 0]; | |||
2438 | k01_21 = ee0[-1] - ee2[-1]; | |||
2439 | ee0[ 0] += ee2[ 0];//ee0[ 0] = ee0[ 0] + ee2[ 0]; | |||
2440 | ee0[-1] += ee2[-1];//ee0[-1] = ee0[-1] + ee2[-1]; | |||
2441 | ee2[ 0] = k00_20 * A[0] - k01_21 * A[1]; | |||
2442 | ee2[-1] = k01_21 * A[0] + k00_20 * A[1]; | |||
2443 | A += 8; | |||
2444 | ||||
2445 | k00_20 = ee0[-2] - ee2[-2]; | |||
2446 | k01_21 = ee0[-3] - ee2[-3]; | |||
2447 | ee0[-2] += ee2[-2];//ee0[-2] = ee0[-2] + ee2[-2]; | |||
2448 | ee0[-3] += ee2[-3];//ee0[-3] = ee0[-3] + ee2[-3]; | |||
2449 | ee2[-2] = k00_20 * A[0] - k01_21 * A[1]; | |||
2450 | ee2[-3] = k01_21 * A[0] + k00_20 * A[1]; | |||
2451 | A += 8; | |||
2452 | ||||
2453 | k00_20 = ee0[-4] - ee2[-4]; | |||
2454 | k01_21 = ee0[-5] - ee2[-5]; | |||
2455 | ee0[-4] += ee2[-4];//ee0[-4] = ee0[-4] + ee2[-4]; | |||
2456 | ee0[-5] += ee2[-5];//ee0[-5] = ee0[-5] + ee2[-5]; | |||
2457 | ee2[-4] = k00_20 * A[0] - k01_21 * A[1]; | |||
2458 | ee2[-5] = k01_21 * A[0] + k00_20 * A[1]; | |||
2459 | A += 8; | |||
2460 | ||||
2461 | k00_20 = ee0[-6] - ee2[-6]; | |||
2462 | k01_21 = ee0[-7] - ee2[-7]; | |||
2463 | ee0[-6] += ee2[-6];//ee0[-6] = ee0[-6] + ee2[-6]; | |||
2464 | ee0[-7] += ee2[-7];//ee0[-7] = ee0[-7] + ee2[-7]; | |||
2465 | ee2[-6] = k00_20 * A[0] - k01_21 * A[1]; | |||
2466 | ee2[-7] = k01_21 * A[0] + k00_20 * A[1]; | |||
2467 | A += 8; | |||
2468 | ee0 -= 8; | |||
2469 | ee2 -= 8; | |||
2470 | } | |||
2471 | } | |||
2472 | ||||
2473 | static void imdct_step3_inner_r_loop(int lim, float *e, int d0, int k_off, float *A, int k1) | |||
2474 | { | |||
2475 | int i; | |||
2476 | float k00_20, k01_21; | |||
2477 | ||||
2478 | float *e0 = e + d0; | |||
2479 | float *e2 = e0 + k_off; | |||
2480 | ||||
2481 | for (i=lim >> 2; i > 0; --i) { | |||
2482 | k00_20 = e0[-0] - e2[-0]; | |||
2483 | k01_21 = e0[-1] - e2[-1]; | |||
2484 | e0[-0] += e2[-0];//e0[-0] = e0[-0] + e2[-0]; | |||
2485 | e0[-1] += e2[-1];//e0[-1] = e0[-1] + e2[-1]; | |||
2486 | e2[-0] = (k00_20)*A[0] - (k01_21) * A[1]; | |||
2487 | e2[-1] = (k01_21)*A[0] + (k00_20) * A[1]; | |||
2488 | ||||
2489 | A += k1; | |||
2490 | ||||
2491 | k00_20 = e0[-2] - e2[-2]; | |||
2492 | k01_21 = e0[-3] - e2[-3]; | |||
2493 | e0[-2] += e2[-2];//e0[-2] = e0[-2] + e2[-2]; | |||
2494 | e0[-3] += e2[-3];//e0[-3] = e0[-3] + e2[-3]; | |||
2495 | e2[-2] = (k00_20)*A[0] - (k01_21) * A[1]; | |||
2496 | e2[-3] = (k01_21)*A[0] + (k00_20) * A[1]; | |||
2497 | ||||
2498 | A += k1; | |||
2499 | ||||
2500 | k00_20 = e0[-4] - e2[-4]; | |||
2501 | k01_21 = e0[-5] - e2[-5]; | |||
2502 | e0[-4] += e2[-4];//e0[-4] = e0[-4] + e2[-4]; | |||
2503 | e0[-5] += e2[-5];//e0[-5] = e0[-5] + e2[-5]; | |||
2504 | e2[-4] = (k00_20)*A[0] - (k01_21) * A[1]; | |||
2505 | e2[-5] = (k01_21)*A[0] + (k00_20) * A[1]; | |||
2506 | ||||
2507 | A += k1; | |||
2508 | ||||
2509 | k00_20 = e0[-6] - e2[-6]; | |||
2510 | k01_21 = e0[-7] - e2[-7]; | |||
2511 | e0[-6] += e2[-6];//e0[-6] = e0[-6] + e2[-6]; | |||
2512 | e0[-7] += e2[-7];//e0[-7] = e0[-7] + e2[-7]; | |||
2513 | e2[-6] = (k00_20)*A[0] - (k01_21) * A[1]; | |||
2514 | e2[-7] = (k01_21)*A[0] + (k00_20) * A[1]; | |||
2515 | ||||
2516 | e0 -= 8; | |||
2517 | e2 -= 8; | |||
2518 | ||||
2519 | A += k1; | |||
2520 | } | |||
2521 | } | |||
2522 | ||||
2523 | static void imdct_step3_inner_s_loop(int n, float *e, int i_off, int k_off, float *A, int a_off, int k0) | |||
2524 | { | |||
2525 | int i; | |||
2526 | float A0 = A[0]; | |||
2527 | float A1 = A[0+1]; | |||
2528 | float A2 = A[0+a_off]; | |||
2529 | float A3 = A[0+a_off+1]; | |||
2530 | float A4 = A[0+a_off*2+0]; | |||
2531 | float A5 = A[0+a_off*2+1]; | |||
2532 | float A6 = A[0+a_off*3+0]; | |||
2533 | float A7 = A[0+a_off*3+1]; | |||
2534 | ||||
2535 | float k00,k11; | |||
2536 | ||||
2537 | float *ee0 = e +i_off; | |||
2538 | float *ee2 = ee0+k_off; | |||
2539 | ||||
2540 | for (i=n; i > 0; --i) { | |||
2541 | k00 = ee0[ 0] - ee2[ 0]; | |||
2542 | k11 = ee0[-1] - ee2[-1]; | |||
2543 | ee0[ 0] = ee0[ 0] + ee2[ 0]; | |||
2544 | ee0[-1] = ee0[-1] + ee2[-1]; | |||
2545 | ee2[ 0] = (k00) * A0 - (k11) * A1; | |||
2546 | ee2[-1] = (k11) * A0 + (k00) * A1; | |||
2547 | ||||
2548 | k00 = ee0[-2] - ee2[-2]; | |||
2549 | k11 = ee0[-3] - ee2[-3]; | |||
2550 | ee0[-2] = ee0[-2] + ee2[-2]; | |||
2551 | ee0[-3] = ee0[-3] + ee2[-3]; | |||
2552 | ee2[-2] = (k00) * A2 - (k11) * A3; | |||
2553 | ee2[-3] = (k11) * A2 + (k00) * A3; | |||
2554 | ||||
2555 | k00 = ee0[-4] - ee2[-4]; | |||
2556 | k11 = ee0[-5] - ee2[-5]; | |||
2557 | ee0[-4] = ee0[-4] + ee2[-4]; | |||
2558 | ee0[-5] = ee0[-5] + ee2[-5]; | |||
2559 | ee2[-4] = (k00) * A4 - (k11) * A5; | |||
2560 | ee2[-5] = (k11) * A4 + (k00) * A5; | |||
2561 | ||||
2562 | k00 = ee0[-6] - ee2[-6]; | |||
2563 | k11 = ee0[-7] - ee2[-7]; | |||
2564 | ee0[-6] = ee0[-6] + ee2[-6]; | |||
2565 | ee0[-7] = ee0[-7] + ee2[-7]; | |||
2566 | ee2[-6] = (k00) * A6 - (k11) * A7; | |||
2567 | ee2[-7] = (k11) * A6 + (k00) * A7; | |||
2568 | ||||
2569 | ee0 -= k0; | |||
2570 | ee2 -= k0; | |||
2571 | } | |||
2572 | } | |||
2573 | ||||
2574 | static __forceinlineinline void iter_54(float *z) | |||
2575 | { | |||
2576 | float k00,k11,k22,k33; | |||
2577 | float y0,y1,y2,y3; | |||
2578 | ||||
2579 | k00 = z[ 0] - z[-4]; | |||
2580 | y0 = z[ 0] + z[-4]; | |||
2581 | y2 = z[-2] + z[-6]; | |||
2582 | k22 = z[-2] - z[-6]; | |||
2583 | ||||
2584 | z[-0] = y0 + y2; // z0 + z4 + z2 + z6 | |||
2585 | z[-2] = y0 - y2; // z0 + z4 - z2 - z6 | |||
2586 | ||||
2587 | // done with y0,y2 | |||
2588 | ||||
2589 | k33 = z[-3] - z[-7]; | |||
2590 | ||||
2591 | z[-4] = k00 + k33; // z0 - z4 + z3 - z7 | |||
2592 | z[-6] = k00 - k33; // z0 - z4 - z3 + z7 | |||
2593 | ||||
2594 | // done with k33 | |||
2595 | ||||
2596 | k11 = z[-1] - z[-5]; | |||
2597 | y1 = z[-1] + z[-5]; | |||
2598 | y3 = z[-3] + z[-7]; | |||
2599 | ||||
2600 | z[-1] = y1 + y3; // z1 + z5 + z3 + z7 | |||
2601 | z[-3] = y1 - y3; // z1 + z5 - z3 - z7 | |||
2602 | z[-5] = k11 - k22; // z1 - z5 + z2 - z6 | |||
2603 | z[-7] = k11 + k22; // z1 - z5 - z2 + z6 | |||
2604 | } | |||
2605 | ||||
2606 | static void imdct_step3_inner_s_loop_ld654(int n, float *e, int i_off, float *A, int base_n) | |||
2607 | { | |||
2608 | int k_off = -8; | |||
2609 | (void)k_off; | |||
2610 | int a_off = base_n >> 3; | |||
2611 | float A2 = A[0+a_off]; | |||
2612 | float *z = e + i_off; | |||
2613 | float *base = z - 16 * n; | |||
2614 | ||||
2615 | while (z > base) { | |||
2616 | float k00,k11; | |||
2617 | ||||
2618 | k00 = z[-0] - z[-8]; | |||
2619 | k11 = z[-1] - z[-9]; | |||
2620 | z[-0] = z[-0] + z[-8]; | |||
2621 | z[-1] = z[-1] + z[-9]; | |||
2622 | z[-8] = k00; | |||
2623 | z[-9] = k11 ; | |||
2624 | ||||
2625 | k00 = z[ -2] - z[-10]; | |||
2626 | k11 = z[ -3] - z[-11]; | |||
2627 | z[ -2] = z[ -2] + z[-10]; | |||
2628 | z[ -3] = z[ -3] + z[-11]; | |||
2629 | z[-10] = (k00+k11) * A2; | |||
2630 | z[-11] = (k11-k00) * A2; | |||
2631 | ||||
2632 | k00 = z[-12] - z[ -4]; // reverse to avoid a unary negation | |||
2633 | k11 = z[ -5] - z[-13]; | |||
2634 | z[ -4] = z[ -4] + z[-12]; | |||
2635 | z[ -5] = z[ -5] + z[-13]; | |||
2636 | z[-12] = k11; | |||
2637 | z[-13] = k00; | |||
2638 | ||||
2639 | k00 = z[-14] - z[ -6]; // reverse to avoid a unary negation | |||
2640 | k11 = z[ -7] - z[-15]; | |||
2641 | z[ -6] = z[ -6] + z[-14]; | |||
2642 | z[ -7] = z[ -7] + z[-15]; | |||
2643 | z[-14] = (k00+k11) * A2; | |||
2644 | z[-15] = (k00-k11) * A2; | |||
2645 | ||||
2646 | iter_54(z); | |||
2647 | iter_54(z-8); | |||
2648 | z -= 16; | |||
2649 | } | |||
2650 | } | |||
2651 | ||||
2652 | static void inverse_mdct(float *buffer, int n, vorb *f, int blocktype) | |||
2653 | { | |||
2654 | int n2 = n >> 1, n4 = n >> 2, n8 = n >> 3, l; | |||
2655 | int n3_4 = n - n4, ld; | |||
2656 | (void)n3_4; | |||
2657 | // @OPTIMIZE: reduce register pressure by using fewer variables? | |||
2658 | int save_point = temp_alloc_save(f)((f)->temp_offset); | |||
2659 | float *buf2 = (float *) temp_alloc(f, n2 * sizeof(*buf2))(f->alloc.alloc_buffer ? setup_temp_malloc(f,n2 * sizeof(* buf2)) : alloca(n2 * sizeof(*buf2))); | |||
2660 | float *u=NULL((void*)0),*v=NULL((void*)0); | |||
2661 | // twiddle factors | |||
2662 | float *A = f->A[blocktype]; | |||
2663 | ||||
2664 | // IMDCT algorithm from "The use of multirate filter banks for coding of high quality digital audio" | |||
2665 | // See notes about bugs in that paper in less-optimal implementation 'inverse_mdct_old' after this function. | |||
2666 | ||||
2667 | // kernel from paper | |||
2668 | ||||
2669 | ||||
2670 | // merged: | |||
2671 | // copy and reflect spectral data | |||
2672 | // step 0 | |||
2673 | ||||
2674 | // note that it turns out that the items added together during | |||
2675 | // this step are, in fact, being added to themselves (as reflected | |||
2676 | // by step 0). inexplicable inefficiency! this became obvious | |||
2677 | // once I combined the passes. | |||
2678 | ||||
2679 | // so there's a missing 'times 2' here (for adding X to itself). | |||
2680 | // this propogates through linearly to the end, where the numbers | |||
2681 | // are 1/2 too small, and need to be compensated for. | |||
2682 | ||||
2683 | { | |||
2684 | float *d,*e, *AA, *e_stop; | |||
2685 | d = &buf2[n2-2]; | |||
2686 | AA = A; | |||
2687 | e = &buffer[0]; | |||
2688 | e_stop = &buffer[n2]; | |||
2689 | while (e != e_stop) { | |||
2690 | d[1] = (e[0] * AA[0] - e[2]*AA[1]); | |||
2691 | d[0] = (e[0] * AA[1] + e[2]*AA[0]); | |||
2692 | d -= 2; | |||
2693 | AA += 2; | |||
2694 | e += 4; | |||
2695 | } | |||
2696 | ||||
2697 | e = &buffer[n2-3]; | |||
2698 | while (d >= buf2) { | |||
2699 | d[1] = (-e[2] * AA[0] - -e[0]*AA[1]); | |||
2700 | d[0] = (-e[2] * AA[1] + -e[0]*AA[0]); | |||
2701 | d -= 2; | |||
2702 | AA += 2; | |||
2703 | e -= 4; | |||
2704 | } | |||
2705 | } | |||
2706 | ||||
2707 | // now we use symbolic names for these, so that we can | |||
2708 | // possibly swap their meaning as we change which operations | |||
2709 | // are in place | |||
2710 | ||||
2711 | u = buffer; | |||
2712 | v = buf2; | |||
2713 | ||||
2714 | // step 2 (paper output is w, now u) | |||
2715 | // this could be in place, but the data ends up in the wrong | |||
2716 | // place... _somebody_'s got to swap it, so this is nominated | |||
2717 | { | |||
2718 | float *AA = &A[n2-8]; | |||
2719 | float *d0,*d1, *e0, *e1; | |||
2720 | ||||
2721 | e0 = &v[n4]; | |||
2722 | e1 = &v[0]; | |||
2723 | ||||
2724 | d0 = &u[n4]; | |||
2725 | d1 = &u[0]; | |||
2726 | ||||
2727 | while (AA >= A) { | |||
2728 | float v40_20, v41_21; | |||
2729 | ||||
2730 | v41_21 = e0[1] - e1[1]; | |||
2731 | v40_20 = e0[0] - e1[0]; | |||
2732 | d0[1] = e0[1] + e1[1]; | |||
2733 | d0[0] = e0[0] + e1[0]; | |||
2734 | d1[1] = v41_21*AA[4] - v40_20*AA[5]; | |||
2735 | d1[0] = v40_20*AA[4] + v41_21*AA[5]; | |||
2736 | ||||
2737 | v41_21 = e0[3] - e1[3]; | |||
2738 | v40_20 = e0[2] - e1[2]; | |||
2739 | d0[3] = e0[3] + e1[3]; | |||
2740 | d0[2] = e0[2] + e1[2]; | |||
2741 | d1[3] = v41_21*AA[0] - v40_20*AA[1]; | |||
2742 | d1[2] = v40_20*AA[0] + v41_21*AA[1]; | |||
2743 | ||||
2744 | AA -= 8; | |||
2745 | ||||
2746 | d0 += 4; | |||
2747 | d1 += 4; | |||
2748 | e0 += 4; | |||
2749 | e1 += 4; | |||
2750 | } | |||
2751 | } | |||
2752 | ||||
2753 | // step 3 | |||
2754 | ld = ilog(n) - 1; // ilog is off-by-one from normal definitions | |||
2755 | ||||
2756 | // optimized step 3: | |||
2757 | ||||
2758 | // the original step3 loop can be nested r inside s or s inside r; | |||
2759 | // it's written originally as s inside r, but this is dumb when r | |||
2760 | // iterates many times, and s few. So I have two copies of it and | |||
2761 | // switch between them halfway. | |||
2762 | ||||
2763 | // this is iteration 0 of step 3 | |||
2764 | imdct_step3_iter0_loop(n >> 4, u, n2-1-n4*0, -(n >> 3), A); | |||
2765 | imdct_step3_iter0_loop(n >> 4, u, n2-1-n4*1, -(n >> 3), A); | |||
2766 | ||||
2767 | // this is iteration 1 of step 3 | |||
2768 | imdct_step3_inner_r_loop(n >> 5, u, n2-1 - n8*0, -(n >> 4), A, 16); | |||
2769 | imdct_step3_inner_r_loop(n >> 5, u, n2-1 - n8*1, -(n >> 4), A, 16); | |||
2770 | imdct_step3_inner_r_loop(n >> 5, u, n2-1 - n8*2, -(n >> 4), A, 16); | |||
2771 | imdct_step3_inner_r_loop(n >> 5, u, n2-1 - n8*3, -(n >> 4), A, 16); | |||
2772 | ||||
2773 | l=2; | |||
2774 | for (; l < (ld-3)>>1; ++l) { | |||
2775 | int k0 = n >> (l+2), k0_2 = k0>>1; | |||
2776 | int lim = 1 << (l+1); | |||
2777 | int i; | |||
2778 | for (i=0; i < lim; ++i) | |||
2779 | imdct_step3_inner_r_loop(n >> (l+4), u, n2-1 - k0*i, -k0_2, A, 1 << (l+3)); | |||
2780 | } | |||
2781 | ||||
2782 | for (; l < ld-6; ++l) { | |||
2783 | int k0 = n >> (l+2), k1 = 1 << (l+3), k0_2 = k0>>1; | |||
2784 | int rlim = n >> (l+6), r; | |||
2785 | int lim = 1 << (l+1); | |||
2786 | int i_off; | |||
2787 | float *A0 = A; | |||
2788 | i_off = n2-1; | |||
2789 | for (r=rlim; r > 0; --r) { | |||
2790 | imdct_step3_inner_s_loop(lim, u, i_off, -k0_2, A0, k1, k0); | |||
2791 | A0 += k1*4; | |||
2792 | i_off -= 8; | |||
2793 | } | |||
2794 | } | |||
2795 | ||||
2796 | // iterations with count: | |||
2797 | // ld-6,-5,-4 all interleaved together | |||
2798 | // the big win comes from getting rid of needless flops | |||
2799 | // due to the constants on pass 5 & 4 being all 1 and 0; | |||
2800 | // combining them to be simultaneous to improve cache made little difference | |||
2801 | imdct_step3_inner_s_loop_ld654(n >> 5, u, n2-1, A, n); | |||
2802 | ||||
2803 | // output is u | |||
2804 | ||||
2805 | // step 4, 5, and 6 | |||
2806 | // cannot be in-place because of step 5 | |||
2807 | { | |||
2808 | uint16 *bitrev = f->bit_reverse[blocktype]; | |||
2809 | // weirdly, I'd have thought reading sequentially and writing | |||
2810 | // erratically would have been better than vice-versa, but in | |||
2811 | // fact that's not what my testing showed. (That is, with | |||
2812 | // j = bitreverse(i), do you read i and write j, or read j and write i.) | |||
2813 | ||||
2814 | float *d0 = &v[n4-4]; | |||
2815 | float *d1 = &v[n2-4]; | |||
2816 | while (d0 >= v) { | |||
2817 | int k4; | |||
2818 | ||||
2819 | k4 = bitrev[0]; | |||
2820 | d1[3] = u[k4+0]; | |||
2821 | d1[2] = u[k4+1]; | |||
2822 | d0[3] = u[k4+2]; | |||
2823 | d0[2] = u[k4+3]; | |||
2824 | ||||
2825 | k4 = bitrev[1]; | |||
2826 | d1[1] = u[k4+0]; | |||
2827 | d1[0] = u[k4+1]; | |||
2828 | d0[1] = u[k4+2]; | |||
2829 | d0[0] = u[k4+3]; | |||
2830 | ||||
2831 | d0 -= 4; | |||
2832 | d1 -= 4; | |||
2833 | bitrev += 2; | |||
2834 | } | |||
2835 | } | |||
2836 | // (paper output is u, now v) | |||
2837 | ||||
2838 | ||||
2839 | // data must be in buf2 | |||
2840 | assert(v == buf2)((v == buf2) ? (void)0 : _assert("v == buf2", "src/siege/internal/stb/stb_vorbis.c" , 2840)); | |||
2841 | ||||
2842 | // step 7 (paper output is v, now v) | |||
2843 | // this is now in place | |||
2844 | { | |||
2845 | float *C(2 | 4 | 1) = f->C(2 | 4 | 1)[blocktype]; | |||
2846 | float *d, *e; | |||
2847 | ||||
2848 | d = v; | |||
2849 | e = v + n2 - 4; | |||
2850 | ||||
2851 | while (d < e) { | |||
2852 | float a02,a11,b0,b1,b2,b3; | |||
2853 | ||||
2854 | a02 = d[0] - e[2]; | |||
2855 | a11 = d[1] + e[3]; | |||
2856 | ||||
2857 | b0 = C(2 | 4 | 1)[1]*a02 + C(2 | 4 | 1)[0]*a11; | |||
2858 | b1 = C(2 | 4 | 1)[1]*a11 - C(2 | 4 | 1)[0]*a02; | |||
2859 | ||||
2860 | b2 = d[0] + e[ 2]; | |||
2861 | b3 = d[1] - e[ 3]; | |||
2862 | ||||
2863 | d[0] = b2 + b0; | |||
2864 | d[1] = b3 + b1; | |||
2865 | e[2] = b2 - b0; | |||
2866 | e[3] = b1 - b3; | |||
2867 | ||||
2868 | a02 = d[2] - e[0]; | |||
2869 | a11 = d[3] + e[1]; | |||
2870 | ||||
2871 | b0 = C(2 | 4 | 1)[3]*a02 + C(2 | 4 | 1)[2]*a11; | |||
2872 | b1 = C(2 | 4 | 1)[3]*a11 - C(2 | 4 | 1)[2]*a02; | |||
2873 | ||||
2874 | b2 = d[2] + e[ 0]; | |||
2875 | b3 = d[3] - e[ 1]; | |||
2876 | ||||
2877 | d[2] = b2 + b0; | |||
2878 | d[3] = b3 + b1; | |||
2879 | e[0] = b2 - b0; | |||
2880 | e[1] = b1 - b3; | |||
2881 | ||||
2882 | C(2 | 4 | 1) += 4; | |||
2883 | d += 4; | |||
2884 | e -= 4; | |||
2885 | } | |||
2886 | } | |||
2887 | ||||
2888 | // data must be in buf2 | |||
2889 | ||||
2890 | ||||
2891 | // step 8+decode (paper output is X, now buffer) | |||
2892 | // this generates pairs of data a la 8 and pushes them directly through | |||
2893 | // the decode kernel (pushing rather than pulling) to avoid having | |||
2894 | // to make another pass later | |||
2895 | ||||
2896 | // this cannot POSSIBLY be in place, so we refer to the buffers directly | |||
2897 | ||||
2898 | { | |||
2899 | float *d0,*d1,*d2,*d3; | |||
2900 | ||||
2901 | float *B = f->B[blocktype] + n2 - 8; | |||
2902 | float *e = buf2 + n2 - 8; | |||
2903 | d0 = &buffer[0]; | |||
2904 | d1 = &buffer[n2-4]; | |||
2905 | d2 = &buffer[n2]; | |||
2906 | d3 = &buffer[n-4]; | |||
2907 | while (e >= v) { | |||
2908 | float p0,p1,p2,p3; | |||
2909 | ||||
2910 | p3 = e[6]*B[7] - e[7]*B[6]; | |||
2911 | p2 = -e[6]*B[6] - e[7]*B[7]; | |||
2912 | ||||
2913 | d0[0] = p3; | |||
2914 | d1[3] = - p3; | |||
2915 | d2[0] = p2; | |||
2916 | d3[3] = p2; | |||
2917 | ||||
2918 | p1 = e[4]*B[5] - e[5]*B[4]; | |||
2919 | p0 = -e[4]*B[4] - e[5]*B[5]; | |||
2920 | ||||
2921 | d0[1] = p1; | |||
2922 | d1[2] = - p1; | |||
2923 | d2[1] = p0; | |||
2924 | d3[2] = p0; | |||
2925 | ||||
2926 | p3 = e[2]*B[3] - e[3]*B[2]; | |||
2927 | p2 = -e[2]*B[2] - e[3]*B[3]; | |||
2928 | ||||
2929 | d0[2] = p3; | |||
2930 | d1[1] = - p3; | |||
2931 | d2[2] = p2; | |||
2932 | d3[1] = p2; | |||
2933 | ||||
2934 | p1 = e[0]*B[1] - e[1]*B[0]; | |||
2935 | p0 = -e[0]*B[0] - e[1]*B[1]; | |||
2936 | ||||
2937 | d0[3] = p1; | |||
2938 | d1[0] = - p1; | |||
2939 | d2[3] = p0; | |||
2940 | d3[0] = p0; | |||
2941 | ||||
2942 | B -= 8; | |||
2943 | e -= 8; | |||
2944 | d0 += 4; | |||
2945 | d2 += 4; | |||
2946 | d1 -= 4; | |||
2947 | d3 -= 4; | |||
2948 | } | |||
2949 | } | |||
2950 | ||||
2951 | temp_alloc_restore(f,save_point)((f)->temp_offset = (save_point)); | |||
2952 | } | |||
2953 | ||||
2954 | #if 0 | |||
2955 | // this is the original version of the above code, if you want to optimize it from scratch | |||
2956 | void inverse_mdct_naive(float *buffer, int n) | |||
2957 | { | |||
2958 | float s; | |||
2959 | float A[1 << 12], B[1 << 12], C(2 | 4 | 1)[1 << 11]; | |||
2960 | int i,k,k2,k4, n2 = n >> 1, n4 = n >> 2, n8 = n >> 3, l; | |||
2961 | int n3_4 = n - n4, ld; | |||
2962 | // how can they claim this only uses N words?! | |||
2963 | // oh, because they're only used sparsely, whoops | |||
2964 | float u[1 << 13], X[1 << 13], v[1 << 13], w[1 << 13]; | |||
2965 | // set up twiddle factors | |||
2966 | ||||
2967 | for (k=k2=0; k < n4; ++k,k2+=2) { | |||
2968 | A[k2 ] = (float) cos(4*k*M_PI3.14159265358979323846/n); | |||
2969 | A[k2+1] = (float) -sin(4*k*M_PI3.14159265358979323846/n); | |||
2970 | B[k2 ] = (float) cos((k2+1)*M_PI3.14159265358979323846/n/2); | |||
2971 | B[k2+1] = (float) sin((k2+1)*M_PI3.14159265358979323846/n/2); | |||
2972 | } | |||
2973 | for (k=k2=0; k < n8; ++k,k2+=2) { | |||
2974 | C(2 | 4 | 1)[k2 ] = (float) cos(2*(k2+1)*M_PI3.14159265358979323846/n); | |||
2975 | C(2 | 4 | 1)[k2+1] = (float) -sin(2*(k2+1)*M_PI3.14159265358979323846/n); | |||
2976 | } | |||
2977 | ||||
2978 | // IMDCT algorithm from "The use of multirate filter banks for coding of high quality digital audio" | |||
2979 | // Note there are bugs in that pseudocode, presumably due to them attempting | |||
2980 | // to rename the arrays nicely rather than representing the way their actual | |||
2981 | // implementation bounces buffers back and forth. As a result, even in the | |||
2982 | // "some formulars corrected" version, a direct implementation fails. These | |||
2983 | // are noted below as "paper bug". | |||
2984 | ||||
2985 | // copy and reflect spectral data | |||
2986 | for (k=0; k < n2; ++k) u[k] = buffer[k]; | |||
2987 | for ( ; k < n ; ++k) u[k] = -buffer[n - k - 1]; | |||
2988 | // kernel from paper | |||
2989 | // step 1 | |||
2990 | for (k=k2=k4=0; k < n4; k+=1, k2+=2, k4+=4) { | |||
2991 | v[n-k4-1] = (u[k4] - u[n-k4-1]) * A[k2] - (u[k4+2] - u[n-k4-3])*A[k2+1]; | |||
2992 | v[n-k4-3] = (u[k4] - u[n-k4-1]) * A[k2+1] + (u[k4+2] - u[n-k4-3])*A[k2]; | |||
2993 | } | |||
2994 | // step 2 | |||
2995 | for (k=k4=0; k < n8; k+=1, k4+=4) { | |||
2996 | w[n2+3+k4] = v[n2+3+k4] + v[k4+3]; | |||
2997 | w[n2+1+k4] = v[n2+1+k4] + v[k4+1]; | |||
2998 | w[k4+3] = (v[n2+3+k4] - v[k4+3])*A[n2-4-k4] - (v[n2+1+k4]-v[k4+1])*A[n2-3-k4]; | |||
2999 | w[k4+1] = (v[n2+1+k4] - v[k4+1])*A[n2-4-k4] + (v[n2+3+k4]-v[k4+3])*A[n2-3-k4]; | |||
3000 | } | |||
3001 | // step 3 | |||
3002 | ld = ilog(n) - 1; // ilog is off-by-one from normal definitions | |||
3003 | for (l=0; l < ld-3; ++l) { | |||
3004 | int k0 = n >> (l+2), k1 = 1 << (l+3); | |||
3005 | int rlim = n >> (l+4), r4, r; | |||
3006 | int s2lim = 1 << (l+2), s2; | |||
3007 | for (r=r4=0; r < rlim; r4+=4,++r) { | |||
3008 | for (s2=0; s2 < s2lim; s2+=2) { | |||
3009 | u[n-1-k0*s2-r4] = w[n-1-k0*s2-r4] + w[n-1-k0*(s2+1)-r4]; | |||
3010 | u[n-3-k0*s2-r4] = w[n-3-k0*s2-r4] + w[n-3-k0*(s2+1)-r4]; | |||
3011 | u[n-1-k0*(s2+1)-r4] = (w[n-1-k0*s2-r4] - w[n-1-k0*(s2+1)-r4]) * A[r*k1] | |||
3012 | - (w[n-3-k0*s2-r4] - w[n-3-k0*(s2+1)-r4]) * A[r*k1+1]; | |||
3013 | u[n-3-k0*(s2+1)-r4] = (w[n-3-k0*s2-r4] - w[n-3-k0*(s2+1)-r4]) * A[r*k1] | |||
3014 | + (w[n-1-k0*s2-r4] - w[n-1-k0*(s2+1)-r4]) * A[r*k1+1]; | |||
3015 | } | |||
3016 | } | |||
3017 | if (l+1 < ld-3) { | |||
3018 | // paper bug: ping-ponging of u&w here is omitted | |||
3019 | memcpy(w, u, sizeof(u)); | |||
3020 | } | |||
3021 | } | |||
3022 | ||||
3023 | // step 4 | |||
3024 | for (i=0; i < n8; ++i) { | |||
3025 | int j = bit_reverse(i) >> (32-ld+3); | |||
3026 | assert(j < n8)((j < n8) ? (void)0 : _assert("j < n8", "src/siege/internal/stb/stb_vorbis.c" , 3026)); | |||
3027 | if (i == j) { | |||
3028 | // paper bug: original code probably swapped in place; if copying, | |||
3029 | // need to directly copy in this case | |||
3030 | int i8 = i << 3; | |||
3031 | v[i8+1] = u[i8+1]; | |||
3032 | v[i8+3] = u[i8+3]; | |||
3033 | v[i8+5] = u[i8+5]; | |||
3034 | v[i8+7] = u[i8+7]; | |||
3035 | } else if (i < j) { | |||
3036 | int i8 = i << 3, j8 = j << 3; | |||
3037 | v[j8+1] = u[i8+1], v[i8+1] = u[j8 + 1]; | |||
3038 | v[j8+3] = u[i8+3], v[i8+3] = u[j8 + 3]; | |||
3039 | v[j8+5] = u[i8+5], v[i8+5] = u[j8 + 5]; | |||
3040 | v[j8+7] = u[i8+7], v[i8+7] = u[j8 + 7]; | |||
3041 | } | |||
3042 | } | |||
3043 | // step 5 | |||
3044 | for (k=0; k < n2; ++k) { | |||
3045 | w[k] = v[k*2+1]; | |||
3046 | } | |||
3047 | // step 6 | |||
3048 | for (k=k2=k4=0; k < n8; ++k, k2 += 2, k4 += 4) { | |||
3049 | u[n-1-k2] = w[k4]; | |||
3050 | u[n-2-k2] = w[k4+1]; | |||
3051 | u[n3_4 - 1 - k2] = w[k4+2]; | |||
3052 | u[n3_4 - 2 - k2] = w[k4+3]; | |||
3053 | } | |||
3054 | // step 7 | |||
3055 | for (k=k2=0; k < n8; ++k, k2 += 2) { | |||
3056 | v[n2 + k2 ] = ( u[n2 + k2] + u[n-2-k2] + C(2 | 4 | 1)[k2+1]*(u[n2+k2]-u[n-2-k2]) + C(2 | 4 | 1)[k2]*(u[n2+k2+1]+u[n-2-k2+1]))/2; | |||
3057 | v[n-2 - k2] = ( u[n2 + k2] + u[n-2-k2] - C(2 | 4 | 1)[k2+1]*(u[n2+k2]-u[n-2-k2]) - C(2 | 4 | 1)[k2]*(u[n2+k2+1]+u[n-2-k2+1]))/2; | |||
3058 | v[n2+1+ k2] = ( u[n2+1+k2] - u[n-1-k2] + C(2 | 4 | 1)[k2+1]*(u[n2+1+k2]+u[n-1-k2]) - C(2 | 4 | 1)[k2]*(u[n2+k2]-u[n-2-k2]))/2; | |||
3059 | v[n-1 - k2] = (-u[n2+1+k2] + u[n-1-k2] + C(2 | 4 | 1)[k2+1]*(u[n2+1+k2]+u[n-1-k2]) - C(2 | 4 | 1)[k2]*(u[n2+k2]-u[n-2-k2]))/2; | |||
3060 | } | |||
3061 | // step 8 | |||
3062 | for (k=k2=0; k < n4; ++k,k2 += 2) { | |||
3063 | X[k] = v[k2+n2]*B[k2 ] + v[k2+1+n2]*B[k2+1]; | |||
3064 | X[n2-1-k] = v[k2+n2]*B[k2+1] - v[k2+1+n2]*B[k2 ]; | |||
3065 | } | |||
3066 | ||||
3067 | // decode kernel to output | |||
3068 | // determined the following value experimentally | |||
3069 | // (by first figuring out what made inverse_mdct_slow work); then matching that here | |||
3070 | // (probably vorbis encoder premultiplies by n or n/2, to save it on the decoder?) | |||
3071 | s = 0.5; // theoretically would be n4 | |||
3072 | ||||
3073 | // [[[ note! the s value of 0.5 is compensated for by the B[] in the current code, | |||
3074 | // so it needs to use the "old" B values to behave correctly, or else | |||
3075 | // set s to 1.0 ]]] | |||
3076 | for (i=0; i < n4 ; ++i) buffer[i] = s * X[i+n4]; | |||
3077 | for ( ; i < n3_4; ++i) buffer[i] = -s * X[n3_4 - i - 1]; | |||
3078 | for ( ; i < n ; ++i) buffer[i] = -s * X[i - n3_4]; | |||
3079 | } | |||
3080 | #endif | |||
3081 | ||||
3082 | static float *get_window(vorb *f, int len) | |||
3083 | { | |||
3084 | len <<= 1; | |||
3085 | if (len == f->blocksize_0) return f->window[0]; | |||
3086 | if (len == f->blocksize_1) return f->window[1]; | |||
3087 | assert(0)((0) ? (void)0 : _assert("0", "src/siege/internal/stb/stb_vorbis.c" , 3087)); | |||
3088 | return NULL((void*)0); | |||
3089 | } | |||
3090 | ||||
3091 | #ifndef STB_VORBIS_NO_DEFER_FLOOR | |||
3092 | typedef int16 YTYPE; | |||
3093 | #else | |||
3094 | typedef int YTYPE; | |||
3095 | #endif | |||
3096 | static int do_floor(vorb *f, Mapping *map, int i, int n, float *target, YTYPE *finalY, uint8 *step2_flag) | |||
3097 | { | |||
3098 | int n2 = n >> 1; | |||
3099 | int s = map->chan[i].mux, floor; | |||
3100 | floor = map->submap_floor[s]; | |||
3101 | if (f->floor_types[floor] == 0) { | |||
3102 | return error(f, VORBIS_invalid_stream); | |||
3103 | } else { | |||
3104 | Floor1 *g = &f->floor_config[floor].floor1; | |||
3105 | int j,q; | |||
3106 | int lx = 0, ly = finalY[0] * g->floor1_multiplier; | |||
3107 | for (q=1; q < g->values; ++q) { | |||
3108 | j = g->sorted_order[q]; | |||
3109 | #ifndef STB_VORBIS_NO_DEFER_FLOOR | |||
3110 | if (finalY[j] >= 0) | |||
3111 | #else | |||
3112 | if (step2_flag[j]) | |||
3113 | #endif | |||
3114 | { | |||
3115 | int hy = finalY[j] * g->floor1_multiplier; | |||
3116 | int hx = g->Xlist[j]; | |||
3117 | draw_line(target, lx,ly, hx,hy, n2); | |||
3118 | lx = hx, ly = hy; | |||
3119 | } | |||
3120 | } | |||
3121 | if (lx < n2) | |||
3122 | // optimization of: draw_line(target, lx,ly, n,ly, n2); | |||
3123 | for (j=lx; j < n2; ++j) | |||
3124 | LINE_OP(target[j], inverse_db_table[ly])target[j] *= inverse_db_table[ly]; | |||
3125 | } | |||
3126 | return TRUE1; | |||
3127 | } | |||
3128 | ||||
3129 | static int vorbis_decode_initial(vorb *f, int *p_left_start, int *p_left_end, int *p_right_start, int *p_right_end, int *mode) | |||
3130 | { | |||
3131 | Mode *m; | |||
3132 | int i, n, prev, next, window_center; | |||
3133 | f->channel_buffer_start = f->channel_buffer_end = 0; | |||
3134 | ||||
3135 | retry: | |||
3136 | if (f->eof) return FALSE0; | |||
3137 | if (!maybe_start_packet(f)) | |||
3138 | return FALSE0; | |||
3139 | // check packet type | |||
3140 | if (get_bits(f,1) != 0) { | |||
3141 | if (IS_PUSH_MODE(f)((f)->push_mode)) | |||
3142 | return error(f,VORBIS_bad_packet_type); | |||
3143 | while (EOP(-1) != get8_packet(f)); | |||
3144 | goto retry; | |||
3145 | } | |||
3146 | ||||
3147 | if (f->alloc.alloc_buffer) | |||
3148 | assert(f->alloc.alloc_buffer_length_in_bytes == f->temp_offset)((f->alloc.alloc_buffer_length_in_bytes == f->temp_offset ) ? (void)0 : _assert("f->alloc.alloc_buffer_length_in_bytes == f->temp_offset" , "src/siege/internal/stb/stb_vorbis.c", 3148)); | |||
3149 | ||||
3150 | i = get_bits(f, ilog(f->mode_count-1)); | |||
3151 | if (i == EOP(-1)) return FALSE0; | |||
3152 | if (i >= f->mode_count) return FALSE0; | |||
3153 | *mode = i; | |||
3154 | m = f->mode_config + i; | |||
3155 | if (m->blockflag) { | |||
3156 | n = f->blocksize_1; | |||
3157 | prev = get_bits(f,1); | |||
3158 | next = get_bits(f,1); | |||
3159 | } else { | |||
3160 | prev = next = 0; | |||
3161 | n = f->blocksize_0; | |||
3162 | } | |||
3163 | ||||
3164 | // WINDOWING | |||
3165 | ||||
3166 | window_center = n >> 1; | |||
3167 | if (m->blockflag && !prev) { | |||
3168 | *p_left_start = (n - f->blocksize_0) >> 2; | |||
3169 | *p_left_end = (n + f->blocksize_0) >> 2; | |||
3170 | } else { | |||
3171 | *p_left_start = 0; | |||
3172 | *p_left_end = window_center; | |||
3173 | } | |||
3174 | if (m->blockflag && !next) { | |||
3175 | *p_right_start = (n*3 - f->blocksize_0) >> 2; | |||
3176 | *p_right_end = (n*3 + f->blocksize_0) >> 2; | |||
3177 | } else { | |||
3178 | *p_right_start = window_center; | |||
3179 | *p_right_end = n; | |||
3180 | } | |||
3181 | return TRUE1; | |||
3182 | } | |||
3183 | ||||
3184 | static int vorbis_decode_packet_rest(vorb *f, int *len, Mode *m, int left_start, int left_end, int right_start, int right_end, int *p_left) | |||
3185 | { | |||
3186 | Mapping *map; | |||
3187 | int i,j,k,n,n2; | |||
3188 | int zero_channel[256]; | |||
3189 | int really_zero_channel[256]; | |||
3190 | int window_center; | |||
3191 | ||||
3192 | // WINDOWING | |||
3193 | ||||
3194 | n = f->blocksize[m->blockflag]; | |||
3195 | window_center = n >> 1; | |||
3196 | (void)window_center; | |||
3197 | ||||
3198 | map = &f->mapping[m->mapping]; | |||
3199 | ||||
3200 | // FLOORS | |||
3201 | n2 = n >> 1; | |||
3202 | ||||
3203 | stb_prof(1)(void)0; | |||
3204 | for (i=0; i < f->channels; ++i) { | |||
3205 | int s = map->chan[i].mux, floor; | |||
3206 | zero_channel[i] = FALSE0; | |||
3207 | floor = map->submap_floor[s]; | |||
3208 | if (f->floor_types[floor] == 0) { | |||
3209 | return error(f, VORBIS_invalid_stream); | |||
3210 | } else { | |||
3211 | Floor1 *g = &f->floor_config[floor].floor1; | |||
3212 | if (get_bits(f, 1)) { | |||
3213 | short *finalY; | |||
3214 | uint8 step2_flag[256]; | |||
3215 | static int range_list[4] = { 256, 128, 86, 64 }; | |||
3216 | int range = range_list[g->floor1_multiplier-1]; | |||
3217 | int offset = 2; | |||
3218 | finalY = f->finalY[i]; | |||
3219 | finalY[0] = get_bits(f, ilog(range)-1); | |||
3220 | finalY[1] = get_bits(f, ilog(range)-1); | |||
3221 | for (j=0; j < g->partitions; ++j) { | |||
3222 | int pclass = g->partition_class_list[j]; | |||
3223 | int cdim = g->class_dimensions[pclass]; | |||
3224 | int cbits = g->class_subclasses[pclass]; | |||
3225 | int csub = (1 << cbits)-1; | |||
3226 | int cval = 0; | |||
3227 | if (cbits) { | |||
3228 | Codebook *c = f->codebooks + g->class_masterbooks[pclass]; | |||
3229 | DECODE(cval,f,c)if (f->valid_bits < 10) prep_huffman(f); cval = f->acc & ((1 << 10) - 1); cval = c->fast_huffman[cval] ; if (cval >= 0) { int n = c->codeword_lengths[cval]; f ->acc >>= n; f->valid_bits -= n; if (f->valid_bits < 0) { f->valid_bits = 0; cval = -1; } } else { cval = codebook_decode_scalar_raw(f,c); } if (c->sparse) cval = c ->sorted_values[cval];; | |||
3230 | } | |||
3231 | for (k=0; k < cdim; ++k) { | |||
3232 | int book = g->subclass_books[pclass][cval & csub]; | |||
3233 | cval = cval >> cbits; | |||
3234 | if (book >= 0) { | |||
3235 | int temp; | |||
3236 | Codebook *c = f->codebooks + book; | |||
3237 | DECODE(temp,f,c)if (f->valid_bits < 10) prep_huffman(f); temp = f->acc & ((1 << 10) - 1); temp = c->fast_huffman[temp] ; if (temp >= 0) { int n = c->codeword_lengths[temp]; f ->acc >>= n; f->valid_bits -= n; if (f->valid_bits < 0) { f->valid_bits = 0; temp = -1; } } else { temp = codebook_decode_scalar_raw(f,c); } if (c->sparse) temp = c ->sorted_values[temp];; | |||
3238 | finalY[offset++] = temp; | |||
3239 | } else | |||
3240 | finalY[offset++] = 0; | |||
3241 | } | |||
3242 | } | |||
3243 | if (f->valid_bits == INVALID_BITS(-1)) goto error; // behavior according to spec | |||
3244 | step2_flag[0] = step2_flag[1] = 1; | |||
3245 | for (j=2; j < g->values; ++j) { | |||
3246 | int low, high, pred, highroom, lowroom, room, val; | |||
3247 | low = g->neighbors[j][0]; | |||
3248 | high = g->neighbors[j][1]; | |||
3249 | //neighbors(g->Xlist, j, &low, &high); | |||
3250 | pred = predict_point(g->Xlist[j], g->Xlist[low], g->Xlist[high], finalY[low], finalY[high]); | |||
3251 | val = finalY[j]; | |||
3252 | highroom = range - pred; | |||
3253 | lowroom = pred; | |||
3254 | if (highroom < lowroom) | |||
3255 | room = highroom * 2; | |||
3256 | else | |||
3257 | room = lowroom * 2; | |||
3258 | if (val) { | |||
3259 | step2_flag[low] = step2_flag[high] = 1; | |||
3260 | step2_flag[j] = 1; | |||
3261 | if (val >= room) | |||
3262 | if (highroom > lowroom) | |||
3263 | finalY[j] = val - lowroom + pred; | |||
3264 | else | |||
3265 | finalY[j] = pred - val + highroom - 1; | |||
3266 | else | |||
3267 | if (val & 1) | |||
3268 | finalY[j] = pred - ((val+1)>>1); | |||
3269 | else | |||
3270 | finalY[j] = pred + (val>>1); | |||
3271 | } else { | |||
3272 | step2_flag[j] = 0; | |||
3273 | finalY[j] = pred; | |||
3274 | } | |||
3275 | } | |||
3276 | ||||
3277 | #ifdef STB_VORBIS_NO_DEFER_FLOOR | |||
3278 | do_floor(f, map, i, n, f->floor_buffers[i], finalY, step2_flag); | |||
3279 | #else | |||
3280 | // defer final floor computation until _after_ residue | |||
3281 | for (j=0; j < g->values; ++j) { | |||
3282 | if (!step2_flag[j]) | |||
3283 | finalY[j] = -1; | |||
3284 | } | |||
3285 | #endif | |||
3286 | } else { | |||
3287 | error: | |||
3288 | zero_channel[i] = TRUE1; | |||
3289 | } | |||
3290 | // So we just defer everything else to later | |||
3291 | ||||
3292 | // at this point we've decoded the floor into buffer | |||
3293 | } | |||
3294 | } | |||
3295 | stb_prof(0)(void)0; | |||
3296 | // at this point we've decoded all floors | |||
3297 | ||||
3298 | if (f->alloc.alloc_buffer) | |||
3299 | assert(f->alloc.alloc_buffer_length_in_bytes == f->temp_offset)((f->alloc.alloc_buffer_length_in_bytes == f->temp_offset ) ? (void)0 : _assert("f->alloc.alloc_buffer_length_in_bytes == f->temp_offset" , "src/siege/internal/stb/stb_vorbis.c", 3299)); | |||
3300 | ||||
3301 | // re-enable coupled channels if necessary | |||
3302 | memcpy(really_zero_channel, zero_channel, sizeof(really_zero_channel[0]) * f->channels); | |||
3303 | for (i=0; i < map->coupling_steps; ++i) | |||
3304 | if (!zero_channel[map->chan[i].magnitude] || !zero_channel[map->chan[i].angle]) { | |||
3305 | zero_channel[map->chan[i].magnitude] = zero_channel[map->chan[i].angle] = FALSE0; | |||
3306 | } | |||
3307 | ||||
3308 | // RESIDUE DECODE | |||
3309 | for (i=0; i < map->submaps; ++i) { | |||
3310 | float *residue_buffers[STB_VORBIS_MAX_CHANNELS16]; | |||
3311 | int r,t; | |||
3312 | uint8 do_not_decode[256]; | |||
3313 | int ch = 0; | |||
3314 | for (j=0; j < f->channels; ++j) { | |||
3315 | if (map->chan[j].mux == i) { | |||
3316 | if (zero_channel[j]) { | |||
3317 | do_not_decode[ch] = TRUE1; | |||
3318 | residue_buffers[ch] = NULL((void*)0); | |||
3319 | } else { | |||
3320 | do_not_decode[ch] = FALSE0; | |||
3321 | residue_buffers[ch] = f->channel_buffers[j]; | |||
3322 | } | |||
3323 | ++ch; | |||
3324 | } | |||
3325 | } | |||
3326 | r = map->submap_residue[i]; | |||
3327 | t = f->residue_types[r]; | |||
3328 | (void)t; | |||
3329 | decode_residue(f, residue_buffers, ch, n2, r, do_not_decode); | |||
3330 | } | |||
3331 | ||||
3332 | if (f->alloc.alloc_buffer) | |||
3333 | assert(f->alloc.alloc_buffer_length_in_bytes == f->temp_offset)((f->alloc.alloc_buffer_length_in_bytes == f->temp_offset ) ? (void)0 : _assert("f->alloc.alloc_buffer_length_in_bytes == f->temp_offset" , "src/siege/internal/stb/stb_vorbis.c", 3333)); | |||
3334 | ||||
3335 | // INVERSE COUPLING | |||
3336 | stb_prof(14)(void)0; | |||
3337 | for (i = map->coupling_steps-1; i >= 0; --i) { | |||
3338 | int n2 = n >> 1; | |||
3339 | float *m = f->channel_buffers[map->chan[i].magnitude]; | |||
3340 | float *a = f->channel_buffers[map->chan[i].angle ]; | |||
3341 | for (j=0; j < n2; ++j) { | |||
3342 | float a2,m2; | |||
3343 | if (m[j] > 0) | |||
3344 | if (a[j] > 0) | |||
3345 | m2 = m[j], a2 = m[j] - a[j]; | |||
3346 | else | |||
3347 | a2 = m[j], m2 = m[j] + a[j]; | |||
3348 | else | |||
3349 | if (a[j] > 0) | |||
3350 | m2 = m[j], a2 = m[j] + a[j]; | |||
3351 | else | |||
3352 | a2 = m[j], m2 = m[j] - a[j]; | |||
3353 | m[j] = m2; | |||
3354 | a[j] = a2; | |||
3355 | } | |||
3356 | } | |||
3357 | ||||
3358 | // finish decoding the floors | |||
3359 | #ifndef STB_VORBIS_NO_DEFER_FLOOR | |||
3360 | stb_prof(15)(void)0; | |||
3361 | for (i=0; i < f->channels; ++i) { | |||
3362 | if (really_zero_channel[i]) { | |||
3363 | memset(f->channel_buffers[i], 0, sizeof(*f->channel_buffers[i]) * n2); | |||
3364 | } else { | |||
3365 | do_floor(f, map, i, n, f->channel_buffers[i], f->finalY[i], NULL((void*)0)); | |||
3366 | } | |||
3367 | } | |||
3368 | #else | |||
3369 | for (i=0; i < f->channels; ++i) { | |||
3370 | if (really_zero_channel[i]) { | |||
3371 | memset(f->channel_buffers[i], 0, sizeof(*f->channel_buffers[i]) * n2); | |||
3372 | } else { | |||
3373 | for (j=0; j < n2; ++j) | |||
3374 | f->channel_buffers[i][j] *= f->floor_buffers[i][j]; | |||
3375 | } | |||
3376 | } | |||
3377 | #endif | |||
3378 | ||||
3379 | // INVERSE MDCT | |||
3380 | stb_prof(16)(void)0; | |||
3381 | for (i=0; i < f->channels; ++i) | |||
3382 | inverse_mdct(f->channel_buffers[i], n, f, m->blockflag); | |||
3383 | stb_prof(0)(void)0; | |||
3384 | ||||
3385 | // this shouldn't be necessary, unless we exited on an error | |||
3386 | // and want to flush to get to the next packet | |||
3387 | flush_packet(f); | |||
3388 | ||||
3389 | if (f->first_decode) { | |||
3390 | // assume we start so first non-discarded sample is sample 0 | |||
3391 | // this isn't to spec, but spec would require us to read ahead | |||
3392 | // and decode the size of all current frames--could be done, | |||
3393 | // but presumably it's not a commonly used feature | |||
3394 | f->current_loc = -n2; // start of first frame is positioned for discard | |||
3395 | // we might have to discard samples "from" the next frame too, | |||
3396 | // if we're lapping a large block then a small at the start? | |||
3397 | f->discard_samples_deferred = n - right_end; | |||
3398 | f->current_loc_valid = TRUE1; | |||
3399 | f->first_decode = FALSE0; | |||
3400 | } else if (f->discard_samples_deferred) { | |||
3401 | left_start += f->discard_samples_deferred; | |||
3402 | *p_left = left_start; | |||
3403 | f->discard_samples_deferred = 0; | |||
3404 | } else if (f->previous_length == 0 && f->current_loc_valid) { | |||
3405 | // we're recovering from a seek... that means we're going to discard | |||
3406 | // the samples from this packet even though we know our position from | |||
3407 | // the last page header, so we need to update the position based on | |||
3408 | // the discarded samples here | |||
3409 | // but wait, the code below is going to add this in itself even | |||
3410 | // on a discard, so we don't need to do it here... | |||
3411 | } | |||
3412 | ||||
3413 | // check if we have ogg information about the sample # for this packet | |||
3414 | if (f->last_seg_which == f->end_seg_with_known_loc) { | |||
3415 | // if we have a valid current loc, and this is final: | |||
3416 | if (f->current_loc_valid && (f->page_flag & PAGEFLAG_last_page4)) { | |||
3417 | uint32 current_end = f->known_loc_for_packet - (n-right_end); | |||
3418 | // then let's infer the size of the (probably) short final frame | |||
3419 | if (current_end < f->current_loc + right_end) { | |||
3420 | if (current_end < f->current_loc) { | |||
3421 | // negative truncation, that's impossible! | |||
3422 | *len = 0; | |||
3423 | } else { | |||
3424 | *len = current_end - f->current_loc; | |||
3425 | } | |||
3426 | *len += left_start; | |||
3427 | f->current_loc += *len; | |||
3428 | return TRUE1; | |||
3429 | } | |||
3430 | } | |||
3431 | // otherwise, just set our sample loc | |||
3432 | // guess that the ogg granule pos refers to the _middle_ of the | |||
3433 | // last frame? | |||
3434 | // set f->current_loc to the position of left_start | |||
3435 | f->current_loc = f->known_loc_for_packet - (n2-left_start); | |||
3436 | f->current_loc_valid = TRUE1; | |||
3437 | } | |||
3438 | if (f->current_loc_valid) | |||
3439 | f->current_loc += (right_start - left_start); | |||
3440 | ||||
3441 | if (f->alloc.alloc_buffer) | |||
3442 | assert(f->alloc.alloc_buffer_length_in_bytes == f->temp_offset)((f->alloc.alloc_buffer_length_in_bytes == f->temp_offset ) ? (void)0 : _assert("f->alloc.alloc_buffer_length_in_bytes == f->temp_offset" , "src/siege/internal/stb/stb_vorbis.c", 3442)); | |||
3443 | *len = right_end; // ignore samples after the window goes to 0 | |||
3444 | return TRUE1; | |||
3445 | } | |||
3446 | ||||
3447 | static int vorbis_decode_packet(vorb *f, int *len, int *p_left, int *p_right) | |||
3448 | { | |||
3449 | int mode, left_end, right_end; | |||
3450 | if (!vorbis_decode_initial(f, p_left, &left_end, p_right, &right_end, &mode)) return 0; | |||
3451 | return vorbis_decode_packet_rest(f, len, f->mode_config + mode, *p_left, left_end, *p_right, right_end, p_left); | |||
3452 | } | |||
3453 | ||||
3454 | static int vorbis_finish_frame(stb_vorbis *f, int len, int left, int right) | |||
3455 | { | |||
3456 | int prev,i,j; | |||
3457 | // we use right&left (the start of the right- and left-window sin()-regions) | |||
3458 | // to determine how much to return, rather than inferring from the rules | |||
3459 | // (same result, clearer code); 'left' indicates where our sin() window | |||
3460 | // starts, therefore where the previous window's right edge starts, and | |||
3461 | // therefore where to start mixing from the previous buffer. 'right' | |||
3462 | // indicates where our sin() ending-window starts, therefore that's where | |||
3463 | // we start saving, and where our returned-data ends. | |||
3464 | ||||
3465 | // mixin from previous window | |||
3466 | if (f->previous_length) { | |||
3467 | int i,j, n = f->previous_length; | |||
3468 | float *w = get_window(f, n); | |||
3469 | for (i=0; i < f->channels; ++i) { | |||
3470 | for (j=0; j < n; ++j) | |||
3471 | f->channel_buffers[i][left+j] = | |||
3472 | f->channel_buffers[i][left+j]*w[ j] + | |||
3473 | f->previous_window[i][ j]*w[n-1-j]; | |||
3474 | } | |||
3475 | } | |||
3476 | ||||
3477 | prev = f->previous_length; | |||
3478 | ||||
3479 | // last half of this data becomes previous window | |||
3480 | f->previous_length = len - right; | |||
3481 | ||||
3482 | // @OPTIMIZE: could avoid this copy by double-buffering the | |||
3483 | // output (flipping previous_window with channel_buffers), but | |||
3484 | // then previous_window would have to be 2x as large, and | |||
3485 | // channel_buffers couldn't be temp mem (although they're NOT | |||
3486 | // currently temp mem, they could be (unless we want to level | |||
3487 | // performance by spreading out the computation)) | |||
3488 | for (i=0; i < f->channels; ++i) | |||
3489 | for (j=0; right+j < len; ++j) | |||
3490 | f->previous_window[i][j] = f->channel_buffers[i][right+j]; | |||
3491 | ||||
3492 | if (!prev) | |||
3493 | // there was no previous packet, so this data isn't valid... | |||
3494 | // this isn't entirely true, only the would-have-overlapped data | |||
3495 | // isn't valid, but this seems to be what the spec requires | |||
3496 | return 0; | |||
3497 | ||||
3498 | // truncate a short frame | |||
3499 | if (len < right) right = len; | |||
3500 | ||||
3501 | f->samples_output += right-left; | |||
3502 | ||||
3503 | return right - left; | |||
3504 | } | |||
3505 | ||||
3506 | static void vorbis_pump_first_frame(stb_vorbis *f) | |||
3507 | { | |||
3508 | int len, right, left; | |||
3509 | if (vorbis_decode_packet(f, &len, &left, &right)) | |||
3510 | vorbis_finish_frame(f, len, left, right); | |||
3511 | } | |||
3512 | ||||
3513 | #ifndef STB_VORBIS_NO_PUSHDATA_API | |||
3514 | static int is_whole_packet_present(stb_vorbis *f, int end_page) | |||
3515 | { | |||
3516 | // make sure that we have the packet available before continuing... | |||
3517 | // this requires a full ogg parse, but we know we can fetch from f->stream | |||
3518 | ||||
3519 | // instead of coding this out explicitly, we could save the current read state, | |||
3520 | // read the next packet with get8() until end-of-packet, check f->eof, then | |||
3521 | // reset the state? but that would be slower, esp. since we'd have over 256 bytes | |||
3522 | // of state to restore (primarily the page segment table) | |||
3523 | ||||
3524 | int s = f->next_seg, first = TRUE1; | |||
3525 | uint8 *p = f->stream; | |||
3526 | ||||
3527 | if (s != -1) { // if we're not starting the packet with a 'continue on next page' flag | |||
3528 | for (; s < f->segment_count; ++s) { | |||
3529 | p += f->segments[s]; | |||
3530 | if (f->segments[s] < 255) // stop at first short segment | |||
3531 | break; | |||
3532 | } | |||
3533 | // either this continues, or it ends it... | |||
3534 | if (end_page) | |||
3535 | if (s < f->segment_count-1) return error(f, VORBIS_invalid_stream); | |||
3536 | if (s == f->segment_count) | |||
3537 | s = -1; // set 'crosses page' flag | |||
3538 | if (p > f->stream_end) return error(f, VORBIS_need_more_data); | |||
3539 | first = FALSE0; | |||
3540 | } | |||
3541 | for (; s == -1;) { | |||
3542 | uint8 *q; | |||
3543 | int n; | |||
3544 | ||||
3545 | // check that we have the page header ready | |||
3546 | if (p + 26 >= f->stream_end) return error(f, VORBIS_need_more_data); | |||
3547 | // validate the page | |||
3548 | if (memcmp(p, ogg_page_header, 4)) return error(f, VORBIS_invalid_stream); | |||
3549 | if (p[4] != 0) return error(f, VORBIS_invalid_stream); | |||
3550 | if (first) { // the first segment must NOT have 'continued_packet', later ones MUST | |||
3551 | if (f->previous_length) | |||
3552 | if ((p[5] & PAGEFLAG_continued_packet1)) return error(f, VORBIS_invalid_stream); | |||
3553 | // if no previous length, we're resynching, so we can come in on a continued-packet, | |||
3554 | // which we'll just drop | |||
3555 | } else { | |||
3556 | if (!(p[5] & PAGEFLAG_continued_packet1)) return error(f, VORBIS_invalid_stream); | |||
3557 | } | |||
3558 | n = p[26]; // segment counts | |||
3559 | q = p+27; // q points to segment table | |||
3560 | p = q + n; // advance past header | |||
3561 | // make sure we've read the segment table | |||
3562 | if (p > f->stream_end) return error(f, VORBIS_need_more_data); | |||
3563 | for (s=0; s < n; ++s) { | |||
3564 | p += q[s]; | |||
3565 | if (q[s] < 255) | |||
3566 | break; | |||
3567 | } | |||
3568 | if (end_page) | |||
3569 | if (s < n-1) return error(f, VORBIS_invalid_stream); | |||
3570 | if (s == f->segment_count) | |||
3571 | s = -1; // set 'crosses page' flag | |||
3572 | if (p > f->stream_end) return error(f, VORBIS_need_more_data); | |||
3573 | first = FALSE0; | |||
3574 | } | |||
3575 | return TRUE1; | |||
3576 | } | |||
3577 | #endif // !STB_VORBIS_NO_PUSHDATA_API | |||
3578 | ||||
3579 | static int start_decoder(vorb *f) | |||
3580 | { | |||
3581 | uint8 header[6], x,y; | |||
3582 | int len,i,j,k, max_submaps = 0; | |||
3583 | int longest_floorlist=0; | |||
3584 | ||||
3585 | // first page, first packet | |||
3586 | ||||
3587 | if (!start_page(f)) return FALSE0; | |||
3588 | // validate page flag | |||
3589 | if (!(f->page_flag & PAGEFLAG_first_page2)) return error(f, VORBIS_invalid_first_page); | |||
3590 | if (f->page_flag & PAGEFLAG_last_page4) return error(f, VORBIS_invalid_first_page); | |||
3591 | if (f->page_flag & PAGEFLAG_continued_packet1) return error(f, VORBIS_invalid_first_page); | |||
3592 | // check for expected packet length | |||
3593 | if (f->segment_count != 1) return error(f, VORBIS_invalid_first_page); | |||
3594 | if (f->segments[0] != 30) return error(f, VORBIS_invalid_first_page); | |||
3595 | // read packet | |||
3596 | // check packet header | |||
3597 | if (get8(f) != VORBIS_packet_id) return error(f, VORBIS_invalid_first_page); | |||
3598 | if (!getn(f, header, 6)) return error(f, VORBIS_unexpected_eof); | |||
3599 | if (!vorbis_validate(header)) return error(f, VORBIS_invalid_first_page); | |||
3600 | // vorbis_version | |||
3601 | if (get32(f) != 0) return error(f, VORBIS_invalid_first_page); | |||
3602 | f->channels = get8(f); if (!f->channels) return error(f, VORBIS_invalid_first_page); | |||
3603 | if (f->channels > STB_VORBIS_MAX_CHANNELS16) return error(f, VORBIS_too_many_channels); | |||
3604 | f->sample_rate = get32(f); if (!f->sample_rate) return error(f, VORBIS_invalid_first_page); | |||
3605 | get32(f); // bitrate_maximum | |||
3606 | get32(f); // bitrate_nominal | |||
3607 | get32(f); // bitrate_minimum | |||
3608 | x = get8(f); | |||
3609 | { int log0,log1; | |||
3610 | log0 = x & 15; | |||
3611 | log1 = x >> 4; | |||
3612 | f->blocksize_0 = 1 << log0; | |||
3613 | f->blocksize_1 = 1 << log1; | |||
3614 | if (log0 < 6 || log0 > 13) return error(f, VORBIS_invalid_setup); | |||
3615 | if (log1 < 6 || log1 > 13) return error(f, VORBIS_invalid_setup); | |||
3616 | if (log0 > log1) return error(f, VORBIS_invalid_setup); | |||
3617 | } | |||
3618 | ||||
3619 | // framing_flag | |||
3620 | x = get8(f); | |||
3621 | if (!(x & 1)) return error(f, VORBIS_invalid_first_page); | |||
3622 | ||||
3623 | // second packet! | |||
3624 | if (!start_page(f)) return FALSE0; | |||
3625 | ||||
3626 | if (!start_packet(f)) return FALSE0; | |||
3627 | do { | |||
3628 | len = next_segment(f); | |||
3629 | skip(f, len); | |||
3630 | f->bytes_in_seg = 0; | |||
3631 | } while (len); | |||
3632 | ||||
3633 | // third packet! | |||
3634 | if (!start_packet(f)) return FALSE0; | |||
3635 | ||||
3636 | #ifndef STB_VORBIS_NO_PUSHDATA_API | |||
3637 | if (IS_PUSH_MODE(f)((f)->push_mode)) { | |||
3638 | if (!is_whole_packet_present(f, TRUE1)) { | |||
3639 | // convert error in ogg header to write type | |||
3640 | if (f->error == VORBIS_invalid_stream) | |||
3641 | f->error = VORBIS_invalid_setup; | |||
3642 | return FALSE0; | |||
3643 | } | |||
3644 | } | |||
3645 | #endif | |||
3646 | ||||
3647 | crc32_init(); // always init it, to avoid multithread race conditions | |||
3648 | ||||
3649 | if (get8_packet(f) != VORBIS_packet_setup) return error(f, VORBIS_invalid_setup); | |||
3650 | for (i=0; i < 6; ++i) header[i] = get8_packet(f); | |||
3651 | if (!vorbis_validate(header)) return error(f, VORBIS_invalid_setup); | |||
3652 | ||||
3653 | // codebooks | |||
3654 | ||||
3655 | f->codebook_count = get_bits(f,8) + 1; | |||
3656 | f->codebooks = (Codebook *) setup_malloc(f, sizeof(*f->codebooks) * f->codebook_count); | |||
3657 | if (f->codebooks == NULL((void*)0)) return error(f, VORBIS_outofmem); | |||
3658 | memset(f->codebooks, 0, sizeof(*f->codebooks) * f->codebook_count); | |||
3659 | for (i=0; i < f->codebook_count; ++i) { | |||
3660 | uint32 *values; | |||
3661 | int ordered, sorted_count; | |||
3662 | int total=0; | |||
3663 | uint8 *lengths; | |||
3664 | Codebook *c = f->codebooks+i; | |||
3665 | x = get_bits(f, 8); if (x != 0x42) return error(f, VORBIS_invalid_setup); | |||
3666 | x = get_bits(f, 8); if (x != 0x43) return error(f, VORBIS_invalid_setup); | |||
3667 | x = get_bits(f, 8); if (x != 0x56) return error(f, VORBIS_invalid_setup); | |||
3668 | x = get_bits(f, 8); | |||
3669 | c->dimensions = (get_bits(f, 8)<<8) + x; | |||
3670 | x = get_bits(f, 8); | |||
3671 | y = get_bits(f, 8); | |||
3672 | c->entries = (get_bits(f, 8)<<16) + (y<<8) + x; | |||
3673 | ordered = get_bits(f,1); | |||
3674 | c->sparse = ordered ? 0 : get_bits(f,1); | |||
3675 | ||||
3676 | if (c->sparse) | |||
3677 | lengths = (uint8 *) setup_temp_malloc(f, c->entries); | |||
3678 | else | |||
3679 | lengths = c->codeword_lengths = (uint8 *) setup_malloc(f, c->entries); | |||
3680 | ||||
3681 | if (!lengths) return error(f, VORBIS_outofmem); | |||
3682 | ||||
3683 | if (ordered) { | |||
3684 | int current_entry = 0; | |||
3685 | int current_length = get_bits(f,5) + 1; | |||
3686 | while (current_entry < c->entries) { | |||
3687 | int limit = c->entries - current_entry; | |||
3688 | int n = get_bits(f, ilog(limit)); | |||
3689 | if (current_entry + n > (int) c->entries) { return error(f, VORBIS_invalid_setup); } | |||
3690 | memset(lengths + current_entry, current_length, n); | |||
3691 | current_entry += n; | |||
3692 | ++current_length; | |||
3693 | } | |||
3694 | } else { | |||
3695 | for (j=0; j < c->entries; ++j) { | |||
3696 | int present = c->sparse ? get_bits(f,1) : 1; | |||
3697 | if (present) { | |||
3698 | lengths[j] = get_bits(f, 5) + 1; | |||
3699 | ++total; | |||
3700 | } else { | |||
3701 | lengths[j] = NO_CODE255; | |||
3702 | } | |||
3703 | } | |||
3704 | } | |||
3705 | ||||
3706 | if (c->sparse && total >= c->entries >> 2) { | |||
3707 | // convert sparse items to non-sparse! | |||
3708 | if (c->entries > (int) f->setup_temp_memory_required) | |||
3709 | f->setup_temp_memory_required = c->entries; | |||
3710 | ||||
3711 | c->codeword_lengths = (uint8 *) setup_malloc(f, c->entries); | |||
3712 | memcpy(c->codeword_lengths, lengths, c->entries); | |||
3713 | setup_temp_free(f, lengths, c->entries); // note this is only safe if there have been no intervening temp mallocs! | |||
3714 | lengths = c->codeword_lengths; | |||
3715 | c->sparse = 0; | |||
3716 | } | |||
3717 | ||||
3718 | // compute the size of the sorted tables | |||
3719 | if (c->sparse) { | |||
3720 | sorted_count = total; | |||
3721 | //assert(total != 0); | |||
3722 | } else { | |||
3723 | sorted_count = 0; | |||
3724 | #ifndef STB_VORBIS_NO_HUFFMAN_BINARY_SEARCH | |||
3725 | for (j=0; j < c->entries; ++j) | |||
3726 | if (lengths[j] > STB_VORBIS_FAST_HUFFMAN_LENGTH10 && lengths[j] != NO_CODE255) | |||
3727 | ++sorted_count; | |||
3728 | #endif | |||
3729 | } | |||
3730 | ||||
3731 | c->sorted_entries = sorted_count; | |||
3732 | values = NULL((void*)0); | |||
3733 | ||||
3734 | if (!c->sparse) { | |||
3735 | c->codewords = (uint32 *) setup_malloc(f, sizeof(c->codewords[0]) * c->entries); | |||
3736 | if (!c->codewords) return error(f, VORBIS_outofmem); | |||
3737 | } else { | |||
3738 | unsigned int size; | |||
3739 | if (c->sorted_entries) { | |||
3740 | c->codeword_lengths = (uint8 *) setup_malloc(f, c->sorted_entries); | |||
3741 | if (!c->codeword_lengths) return error(f, VORBIS_outofmem); | |||
3742 | c->codewords = (uint32 *) setup_temp_malloc(f, sizeof(*c->codewords) * c->sorted_entries); | |||
3743 | if (!c->codewords) return error(f, VORBIS_outofmem); | |||
3744 | values = (uint32 *) setup_temp_malloc(f, sizeof(*values) * c->sorted_entries); | |||
3745 | if (!values) return error(f, VORBIS_outofmem); | |||
3746 | } | |||
3747 | size = c->entries + (sizeof(*c->codewords) + sizeof(*values)) * c->sorted_entries; | |||
3748 | if (size > f->setup_temp_memory_required) | |||
3749 | f->setup_temp_memory_required = size; | |||
3750 | } | |||
3751 | ||||
3752 | if (!compute_codewords(c, lengths, c->entries, values)) { | |||
3753 | if (c->sparse) setup_temp_free(f, values, 0); | |||
3754 | return error(f, VORBIS_invalid_setup); | |||
3755 | } | |||
3756 | ||||
3757 | if (c->sorted_entries) { | |||
3758 | // allocate an extra slot for sentinels | |||
3759 | c->sorted_codewords = (uint32 *) setup_malloc(f, sizeof(*c->sorted_codewords) * (c->sorted_entries+1)); | |||
3760 | // allocate an extra slot at the front so that c->sorted_values[-1] is defined | |||
3761 | // so that we can catch that case without an extra if | |||
3762 | c->sorted_values = ( int *) setup_malloc(f, sizeof(*c->sorted_values ) * (c->sorted_entries+1)); | |||
3763 | if (c->sorted_values) { ++c->sorted_values; c->sorted_values[-1] = -1; } | |||
3764 | compute_sorted_huffman(c, lengths, values); | |||
3765 | } | |||
3766 | ||||
3767 | if (c->sparse) { | |||
3768 | setup_temp_free(f, values, sizeof(*values)*c->sorted_entries); | |||
3769 | setup_temp_free(f, c->codewords, sizeof(*c->codewords)*c->sorted_entries); | |||
3770 | setup_temp_free(f, lengths, c->entries); | |||
3771 | c->codewords = NULL((void*)0); | |||
3772 | } | |||
3773 | ||||
3774 | compute_accelerated_huffman(c); | |||
3775 | ||||
3776 | c->lookup_type = get_bits(f, 4); | |||
3777 | if (c->lookup_type > 2) return error(f, VORBIS_invalid_setup); | |||
3778 | if (c->lookup_type > 0) { | |||
3779 | uint16 *mults; | |||
3780 | c->minimum_value = float32_unpack(get_bits(f, 32)); | |||
3781 | c->delta_value = float32_unpack(get_bits(f, 32)); | |||
3782 | c->value_bits = get_bits(f, 4)+1; | |||
3783 | c->sequence_p = get_bits(f,1); | |||
3784 | if (c->lookup_type == 1) { | |||
3785 | c->lookup_values = lookup1_values(c->entries, c->dimensions); | |||
3786 | } else { | |||
3787 | c->lookup_values = c->entries * c->dimensions; | |||
3788 | } | |||
3789 | mults = (uint16 *) setup_temp_malloc(f, sizeof(mults[0]) * c->lookup_values); | |||
3790 | if (mults == NULL((void*)0)) return error(f, VORBIS_outofmem); | |||
3791 | for (j=0; j < (int) c->lookup_values; ++j) { | |||
3792 | int q = get_bits(f, c->value_bits); | |||
3793 | if (q == EOP(-1)) { setup_temp_free(f,mults,sizeof(mults[0])*c->lookup_values); return error(f, VORBIS_invalid_setup); } | |||
3794 | mults[j] = q; | |||
3795 | } | |||
3796 | ||||
3797 | #ifndef STB_VORBIS_DIVIDES_IN_CODEBOOK | |||
3798 | if (c->lookup_type == 1) { | |||
3799 | int len, sparse = c->sparse; | |||
3800 | // pre-expand the lookup1-style multiplicands, to avoid a divide in the inner loop | |||
3801 | if (sparse) { | |||
3802 | if (c->sorted_entries == 0) goto skip; | |||
3803 | c->multiplicands = (codetype *) setup_malloc(f, sizeof(c->multiplicands[0]) * c->sorted_entries * c->dimensions); | |||
3804 | } else | |||
3805 | c->multiplicands = (codetype *) setup_malloc(f, sizeof(c->multiplicands[0]) * c->entries * c->dimensions); | |||
3806 | if (c->multiplicands == NULL((void*)0)) { setup_temp_free(f,mults,sizeof(mults[0])*c->lookup_values); return error(f, VORBIS_outofmem); } | |||
3807 | len = sparse ? c->sorted_entries : c->entries; | |||
3808 | for (j=0; j < len; ++j) { | |||
3809 | int z = sparse ? c->sorted_values[j] : j, div=1; | |||
3810 | for (k=0; k < c->dimensions; ++k) { | |||
3811 | int off = (z / div) % c->lookup_values; | |||
3812 | c->multiplicands[j*c->dimensions + k] = | |||
3813 | #ifndef STB_VORBIS_CODEBOOK_FLOATS | |||
3814 | mults[off]; | |||
3815 | #else | |||
3816 | mults[off]*c->delta_value + c->minimum_value; | |||
3817 | // in this case (and this case only) we could pre-expand c->sequence_p, | |||
3818 | // and throw away the decode logic for it; have to ALSO do | |||
3819 | // it in the case below, but it can only be done if | |||
3820 | // STB_VORBIS_CODEBOOK_FLOATS | |||
3821 | // !STB_VORBIS_DIVIDES_IN_CODEBOOK | |||
3822 | #endif | |||
3823 | div *= c->lookup_values; | |||
3824 | } | |||
3825 | } | |||
3826 | setup_temp_free(f, mults,sizeof(mults[0])*c->lookup_values); | |||
3827 | c->lookup_type = 2; | |||
3828 | } | |||
3829 | else | |||
3830 | #endif | |||
3831 | { | |||
3832 | c->multiplicands = (codetype *) setup_malloc(f, sizeof(c->multiplicands[0]) * c->lookup_values); | |||
3833 | #ifndef STB_VORBIS_CODEBOOK_FLOATS | |||
3834 | memcpy(c->multiplicands, mults, sizeof(c->multiplicands[0]) * c->lookup_values); | |||
3835 | #else | |||
3836 | for (j=0; j < (int) c->lookup_values; ++j) | |||
3837 | c->multiplicands[j] = mults[j] * c->delta_value + c->minimum_value; | |||
3838 | setup_temp_free(f, mults,sizeof(mults[0])*c->lookup_values); | |||
3839 | #endif | |||
3840 | } | |||
3841 | skip:; | |||
3842 | ||||
3843 | #ifdef STB_VORBIS_CODEBOOK_FLOATS | |||
3844 | if (c->lookup_type == 2 && c->sequence_p) { | |||
3845 | for (j=1; j < (int) c->lookup_values; ++j) | |||
3846 | c->multiplicands[j] = c->multiplicands[j-1]; | |||
3847 | c->sequence_p = 0; | |||
3848 | } | |||
3849 | #endif | |||
3850 | } | |||
3851 | } | |||
3852 | ||||
3853 | // time domain transfers (notused) | |||
3854 | ||||
3855 | x = get_bits(f, 6) + 1; | |||
3856 | for (i=0; i < x; ++i) { | |||
3857 | uint32 z = get_bits(f, 16); | |||
3858 | if (z != 0) return error(f, VORBIS_invalid_setup); | |||
3859 | } | |||
3860 | ||||
3861 | // Floors | |||
3862 | f->floor_count = get_bits(f, 6)+1; | |||
3863 | f->floor_config = (Floor *) setup_malloc(f, f->floor_count * sizeof(*f->floor_config)); | |||
3864 | for (i=0; i < f->floor_count; ++i) { | |||
3865 | f->floor_types[i] = get_bits(f, 16); | |||
3866 | if (f->floor_types[i] > 1) return error(f, VORBIS_invalid_setup); | |||
3867 | if (f->floor_types[i] == 0) { | |||
3868 | Floor0 *g = &f->floor_config[i].floor0; | |||
3869 | g->order = get_bits(f,8); | |||
3870 | g->rate = get_bits(f,16); | |||
3871 | g->bark_map_size = get_bits(f,16); | |||
3872 | g->amplitude_bits = get_bits(f,6); | |||
3873 | g->amplitude_offset = get_bits(f,8); | |||
3874 | g->number_of_books = get_bits(f,4) + 1; | |||
3875 | for (j=0; j < g->number_of_books; ++j) | |||
3876 | g->book_list[j] = get_bits(f,8); | |||
3877 | return error(f, VORBIS_feature_not_supported); | |||
3878 | } else { | |||
3879 | Point p[31*8+2]; | |||
3880 | Floor1 *g = &f->floor_config[i].floor1; | |||
3881 | int max_class = -1; | |||
3882 | g->partitions = get_bits(f, 5); | |||
3883 | for (j=0; j < g->partitions; ++j) { | |||
3884 | g->partition_class_list[j] = get_bits(f, 4); | |||
3885 | if (g->partition_class_list[j] > max_class) | |||
3886 | max_class = g->partition_class_list[j]; | |||
3887 | } | |||
3888 | for (j=0; j <= max_class; ++j) { | |||
3889 | g->class_dimensions[j] = get_bits(f, 3)+1; | |||
3890 | g->class_subclasses[j] = get_bits(f, 2); | |||
3891 | if (g->class_subclasses[j]) { | |||
3892 | g->class_masterbooks[j] = get_bits(f, 8); | |||
3893 | if (g->class_masterbooks[j] >= f->codebook_count) return error(f, VORBIS_invalid_setup); | |||
3894 | } | |||
3895 | for (k=0; k < 1 << g->class_subclasses[j]; ++k) { | |||
3896 | g->subclass_books[j][k] = get_bits(f,8)-1; | |||
3897 | if (g->subclass_books[j][k] >= f->codebook_count) return error(f, VORBIS_invalid_setup); | |||
3898 | } | |||
3899 | } | |||
3900 | g->floor1_multiplier = get_bits(f,2)+1; | |||
3901 | g->rangebits = get_bits(f,4); | |||
3902 | g->Xlist[0] = 0; | |||
3903 | g->Xlist[1] = 1 << g->rangebits; | |||
3904 | g->values = 2; | |||
3905 | for (j=0; j < g->partitions; ++j) { | |||
3906 | int c = g->partition_class_list[j]; | |||
3907 | for (k=0; k < g->class_dimensions[c]; ++k) { | |||
3908 | g->Xlist[g->values] = get_bits(f, g->rangebits); | |||
3909 | ++g->values; | |||
3910 | } | |||
3911 | } | |||
3912 | // precompute the sorting | |||
3913 | for (j=0; j < g->values; ++j) { | |||
3914 | p[j].x = g->Xlist[j]; | |||
3915 | p[j].y = j; | |||
3916 | } | |||
3917 | qsort(p, g->values, sizeof(p[0]), point_compare); | |||
3918 | for (j=0; j < g->values; ++j) | |||
3919 | g->sorted_order[j] = (uint8) p[j].y; | |||
3920 | // precompute the neighbors | |||
3921 | for (j=2; j < g->values; ++j) { | |||
3922 | int low,hi; | |||
3923 | neighbors(g->Xlist, j, &low,&hi); | |||
3924 | g->neighbors[j][0] = low; | |||
3925 | g->neighbors[j][1] = hi; | |||
3926 | } | |||
3927 | ||||
3928 | if (g->values > longest_floorlist) | |||
3929 | longest_floorlist = g->values; | |||
3930 | } | |||
3931 | } | |||
3932 | ||||
3933 | // Residue | |||
3934 | f->residue_count = get_bits(f, 6)+1; | |||
3935 | f->residue_config = (Residue *) setup_malloc(f, f->residue_count * sizeof(*f->residue_config)); | |||
3936 | for (i=0; i < f->residue_count; ++i) { | |||
3937 | uint8 residue_cascade[64]; | |||
3938 | Residue *r = f->residue_config+i; | |||
3939 | f->residue_types[i] = get_bits(f, 16); | |||
3940 | if (f->residue_types[i] > 2) return error(f, VORBIS_invalid_setup); | |||
3941 | r->begin = get_bits(f, 24); | |||
3942 | r->end = get_bits(f, 24); | |||
3943 | r->part_size = get_bits(f,24)+1; | |||
3944 | r->classifications = get_bits(f,6)+1; | |||
3945 | r->classbook = get_bits(f,8); | |||
3946 | for (j=0; j < r->classifications; ++j) { | |||
3947 | uint8 high_bits=0; | |||
3948 | uint8 low_bits=get_bits(f,3); | |||
3949 | if (get_bits(f,1)) | |||
3950 | high_bits = get_bits(f,5); | |||
3951 | residue_cascade[j] = high_bits*8 + low_bits; | |||
3952 | } | |||
3953 | r->residue_books = (short (*)[8]) setup_malloc(f, sizeof(r->residue_books[0]) * r->classifications); | |||
3954 | for (j=0; j < r->classifications; ++j) { | |||
3955 | for (k=0; k < 8; ++k) { | |||
3956 | if (residue_cascade[j] & (1 << k)) { | |||
3957 | r->residue_books[j][k] = get_bits(f, 8); | |||
3958 | if (r->residue_books[j][k] >= f->codebook_count) return error(f, VORBIS_invalid_setup); | |||
3959 | } else { | |||
3960 | r->residue_books[j][k] = -1; | |||
3961 | } | |||
3962 | } | |||
3963 | } | |||
3964 | // precompute the classifications[] array to avoid inner-loop mod/divide | |||
3965 | // call it 'classdata' since we already have r->classifications | |||
3966 | r->classdata = (uint8 **) setup_malloc(f, sizeof(*r->classdata) * f->codebooks[r->classbook].entries); | |||
3967 | if (!r->classdata) return error(f, VORBIS_outofmem); | |||
3968 | memset(r->classdata, 0, sizeof(*r->classdata) * f->codebooks[r->classbook].entries); | |||
3969 | for (j=0; j < f->codebooks[r->classbook].entries; ++j) { | |||
3970 | int classwords = f->codebooks[r->classbook].dimensions; | |||
3971 | int temp = j; | |||
3972 | r->classdata[j] = (uint8 *) setup_malloc(f, sizeof(r->classdata[j][0]) * classwords); | |||
3973 | for (k=classwords-1; k >= 0; --k) { | |||
3974 | r->classdata[j][k] = temp % r->classifications; | |||
3975 | temp /= r->classifications; | |||
3976 | } | |||
3977 | } | |||
3978 | } | |||
3979 | ||||
3980 | f->mapping_count = get_bits(f,6)+1; | |||
3981 | f->mapping = (Mapping *) setup_malloc(f, f->mapping_count * sizeof(*f->mapping)); | |||
3982 | for (i=0; i < f->mapping_count; ++i) { | |||
3983 | Mapping *m = f->mapping + i; | |||
3984 | int mapping_type = get_bits(f,16); | |||
3985 | if (mapping_type != 0) return error(f, VORBIS_invalid_setup); | |||
3986 | m->chan = (MappingChannel *) setup_malloc(f, f->channels * sizeof(*m->chan)); | |||
3987 | if (get_bits(f,1)) | |||
3988 | m->submaps = get_bits(f,4); | |||
3989 | else | |||
3990 | m->submaps = 1; | |||
3991 | if (m->submaps > max_submaps) | |||
3992 | max_submaps = m->submaps; | |||
3993 | if (get_bits(f,1)) { | |||
3994 | m->coupling_steps = get_bits(f,8)+1; | |||
3995 | for (k=0; k < m->coupling_steps; ++k) { | |||
3996 | m->chan[k].magnitude = get_bits(f, ilog(f->channels)-1); | |||
3997 | m->chan[k].angle = get_bits(f, ilog(f->channels)-1); | |||
3998 | if (m->chan[k].magnitude >= f->channels) return error(f, VORBIS_invalid_setup); | |||
3999 | if (m->chan[k].angle >= f->channels) return error(f, VORBIS_invalid_setup); | |||
4000 | if (m->chan[k].magnitude == m->chan[k].angle) return error(f, VORBIS_invalid_setup); | |||
4001 | } | |||
4002 | } else | |||
4003 | m->coupling_steps = 0; | |||
4004 | ||||
4005 | // reserved field | |||
4006 | if (get_bits(f,2)) return error(f, VORBIS_invalid_setup); | |||
4007 | if (m->submaps > 1) { | |||
4008 | for (j=0; j < f->channels; ++j) { | |||
4009 | m->chan[j].mux = get_bits(f, 4); | |||
4010 | if (m->chan[j].mux >= m->submaps) return error(f, VORBIS_invalid_setup); | |||
4011 | } | |||
4012 | } else | |||
4013 | // @SPECIFICATION: this case is missing from the spec | |||
4014 | for (j=0; j < f->channels; ++j) | |||
4015 | m->chan[j].mux = 0; | |||
4016 | ||||
4017 | for (j=0; j < m->submaps; ++j) { | |||
4018 | get_bits(f,8); // discard | |||
4019 | m->submap_floor[j] = get_bits(f,8); | |||
4020 | m->submap_residue[j] = get_bits(f,8); | |||
4021 | if (m->submap_floor[j] >= f->floor_count) return error(f, VORBIS_invalid_setup); | |||
4022 | if (m->submap_residue[j] >= f->residue_count) return error(f, VORBIS_invalid_setup); | |||
4023 | } | |||
4024 | } | |||
4025 | ||||
4026 | // Modes | |||
4027 | f->mode_count = get_bits(f, 6)+1; | |||
4028 | for (i=0; i < f->mode_count; ++i) { | |||
4029 | Mode *m = f->mode_config+i; | |||
4030 | m->blockflag = get_bits(f,1); | |||
4031 | m->windowtype = get_bits(f,16); | |||
4032 | m->transformtype = get_bits(f,16); | |||
4033 | m->mapping = get_bits(f,8); | |||
4034 | if (m->windowtype != 0) return error(f, VORBIS_invalid_setup); | |||
4035 | if (m->transformtype != 0) return error(f, VORBIS_invalid_setup); | |||
4036 | if (m->mapping >= f->mapping_count) return error(f, VORBIS_invalid_setup); | |||
4037 | } | |||
4038 | ||||
4039 | flush_packet(f); | |||
4040 | ||||
4041 | f->previous_length = 0; | |||
4042 | ||||
4043 | for (i=0; i < f->channels; ++i) { | |||
4044 | f->channel_buffers[i] = (float *) setup_malloc(f, sizeof(float) * f->blocksize_1); | |||
4045 | f->previous_window[i] = (float *) setup_malloc(f, sizeof(float) * f->blocksize_1/2); | |||
4046 | f->finalY[i] = (int16 *) setup_malloc(f, sizeof(int16) * longest_floorlist); | |||
4047 | #ifdef STB_VORBIS_NO_DEFER_FLOOR | |||
4048 | f->floor_buffers[i] = (float *) setup_malloc(f, sizeof(float) * f->blocksize_1/2); | |||
4049 | #endif | |||
4050 | } | |||
4051 | ||||
4052 | if (!init_blocksize(f, 0, f->blocksize_0)) return FALSE0; | |||
4053 | if (!init_blocksize(f, 1, f->blocksize_1)) return FALSE0; | |||
4054 | f->blocksize[0] = f->blocksize_0; | |||
4055 | f->blocksize[1] = f->blocksize_1; | |||
4056 | ||||
4057 | #ifdef STB_VORBIS_DIVIDE_TABLE | |||
4058 | if (integer_divide_table[1][1]==0) | |||
4059 | for (i=0; i < DIVTAB_NUMER; ++i) | |||
4060 | for (j=1; j < DIVTAB_DENOM; ++j) | |||
4061 | integer_divide_table[i][j] = i / j; | |||
4062 | #endif | |||
4063 | ||||
4064 | // compute how much temporary memory is needed | |||
4065 | ||||
4066 | // 1. | |||
4067 | { | |||
4068 | uint32 imdct_mem = (f->blocksize_1 * sizeof(float) >> 1); | |||
4069 | uint32 classify_mem; | |||
4070 | int i,max_part_read=0; | |||
4071 | for (i=0; i < f->residue_count; ++i) { | |||
4072 | Residue *r = f->residue_config + i; | |||
4073 | int n_read = r->end - r->begin; | |||
4074 | int part_read = n_read / r->part_size; | |||
4075 | if (part_read > max_part_read) | |||
4076 | max_part_read = part_read; | |||
4077 | } | |||
4078 | #ifndef STB_VORBIS_DIVIDES_IN_RESIDUE | |||
4079 | classify_mem = f->channels * (sizeof(void*) + max_part_read * sizeof(uint8 *)); | |||
4080 | #else | |||
4081 | classify_mem = f->channels * (sizeof(void*) + max_part_read * sizeof(int *)); | |||
4082 | #endif | |||
4083 | ||||
4084 | f->temp_memory_required = classify_mem; | |||
4085 | if (imdct_mem > f->temp_memory_required) | |||
4086 | f->temp_memory_required = imdct_mem; | |||
4087 | } | |||
4088 | ||||
4089 | f->first_decode = TRUE1; | |||
4090 | ||||
4091 | if (f->alloc.alloc_buffer) { | |||
4092 | assert(f->temp_offset == f->alloc.alloc_buffer_length_in_bytes)((f->temp_offset == f->alloc.alloc_buffer_length_in_bytes ) ? (void)0 : _assert("f->temp_offset == f->alloc.alloc_buffer_length_in_bytes" , "src/siege/internal/stb/stb_vorbis.c", 4092)); | |||
4093 | // check if there's enough temp memory so we don't error later | |||
4094 | if (f->setup_offset + sizeof(*f) + f->temp_memory_required > (unsigned) f->temp_offset) | |||
4095 | return error(f, VORBIS_outofmem); | |||
4096 | } | |||
4097 | ||||
4098 | f->first_audio_page_offset = stb_vorbis_get_file_offset(f); | |||
4099 | ||||
4100 | return TRUE1; | |||
4101 | } | |||
4102 | ||||
4103 | static void vorbis_deinit(stb_vorbis *p) | |||
4104 | { | |||
4105 | int i,j; | |||
4106 | for (i=0; i < p->residue_count; ++i) { | |||
4107 | Residue *r = p->residue_config+i; | |||
4108 | if (r->classdata) { | |||
4109 | for (j=0; j < p->codebooks[r->classbook].entries; ++j) | |||
4110 | setup_free(p, r->classdata[j]); | |||
4111 | setup_free(p, r->classdata); | |||
4112 | } | |||
4113 | setup_free(p, r->residue_books); | |||
4114 | } | |||
4115 | ||||
4116 | if (p->codebooks) { | |||
4117 | for (i=0; i < p->codebook_count; ++i) { | |||
4118 | Codebook *c = p->codebooks + i; | |||
4119 | setup_free(p, c->codeword_lengths); | |||
4120 | setup_free(p, c->multiplicands); | |||
4121 | setup_free(p, c->codewords); | |||
4122 | setup_free(p, c->sorted_codewords); | |||
4123 | // c->sorted_values[-1] is the first entry in the array | |||
4124 | setup_free(p, c->sorted_values ? c->sorted_values-1 : NULL((void*)0)); | |||
4125 | } | |||
4126 | setup_free(p, p->codebooks); | |||
4127 | } | |||
4128 | setup_free(p, p->floor_config); | |||
4129 | setup_free(p, p->residue_config); | |||
4130 | for (i=0; i < p->mapping_count; ++i) | |||
4131 | setup_free(p, p->mapping[i].chan); | |||
4132 | setup_free(p, p->mapping); | |||
4133 | for (i=0; i < p->channels; ++i) { | |||
4134 | setup_free(p, p->channel_buffers[i]); | |||
4135 | setup_free(p, p->previous_window[i]); | |||
4136 | #ifdef STB_VORBIS_NO_DEFER_FLOOR | |||
4137 | setup_free(p, p->floor_buffers[i]); | |||
4138 | #endif | |||
4139 | setup_free(p, p->finalY[i]); | |||
4140 | } | |||
4141 | for (i=0; i < 2; ++i) { | |||
4142 | setup_free(p, p->A[i]); | |||
4143 | setup_free(p, p->B[i]); | |||
4144 | setup_free(p, p->C(2 | 4 | 1)[i]); | |||
4145 | setup_free(p, p->window[i]); | |||
4146 | } | |||
4147 | #ifndef STB_VORBIS_NO_STDIO | |||
4148 | if (p->close_on_free) fclose(p->f); | |||
4149 | #endif | |||
4150 | } | |||
4151 | ||||
4152 | void stb_vorbis_close(stb_vorbis *p) | |||
4153 | { | |||
4154 | if (p == NULL((void*)0)) return; | |||
4155 | vorbis_deinit(p); | |||
4156 | setup_free(p,p); | |||
4157 | } | |||
4158 | ||||
4159 | static void vorbis_init(stb_vorbis *p, stb_vorbis_alloc *z) | |||
4160 | { | |||
4161 | memset(p, 0, sizeof(*p)); // NULL out all malloc'd pointers to start | |||
4162 | if (z) { | |||
4163 | p->alloc = *z; | |||
4164 | p->alloc.alloc_buffer_length_in_bytes = (p->alloc.alloc_buffer_length_in_bytes+3) & ~3; | |||
4165 | p->temp_offset = p->alloc.alloc_buffer_length_in_bytes; | |||
4166 | } | |||
4167 | p->eof = 0; | |||
4168 | p->error = VORBIS__no_error; | |||
4169 | p->stream = NULL((void*)0); | |||
4170 | p->codebooks = NULL((void*)0); | |||
4171 | p->page_crc_tests = -1; | |||
4172 | #ifndef STB_VORBIS_NO_STDIO | |||
4173 | p->close_on_free = FALSE0; | |||
4174 | p->f = NULL((void*)0); | |||
4175 | #endif | |||
4176 | } | |||
4177 | ||||
4178 | int stb_vorbis_get_sample_offset(stb_vorbis *f) | |||
4179 | { | |||
4180 | if (f->current_loc_valid) | |||
4181 | return f->current_loc; | |||
4182 | else | |||
4183 | return -1; | |||
4184 | } | |||
4185 | ||||
4186 | stb_vorbis_info stb_vorbis_get_info(stb_vorbis *f) | |||
4187 | { | |||
4188 | stb_vorbis_info d; | |||
4189 | d.channels = f->channels; | |||
4190 | d.sample_rate = f->sample_rate; | |||
4191 | d.setup_memory_required = f->setup_memory_required; | |||
4192 | d.setup_temp_memory_required = f->setup_temp_memory_required; | |||
4193 | d.temp_memory_required = f->temp_memory_required; | |||
4194 | d.max_frame_size = f->blocksize_1 >> 1; | |||
4195 | return d; | |||
4196 | } | |||
4197 | ||||
4198 | int stb_vorbis_get_error(stb_vorbis *f) | |||
4199 | { | |||
4200 | int e = f->error; | |||
4201 | f->error = VORBIS__no_error; | |||
4202 | return e; | |||
4203 | } | |||
4204 | ||||
4205 | static stb_vorbis * vorbis_alloc(stb_vorbis *f) | |||
4206 | { | |||
4207 | stb_vorbis *p = (stb_vorbis *) setup_malloc(f, sizeof(*p)); | |||
4208 | return p; | |||
4209 | } | |||
4210 | ||||
4211 | #ifndef STB_VORBIS_NO_PUSHDATA_API | |||
4212 | ||||
4213 | void stb_vorbis_flush_pushdata(stb_vorbis *f) | |||
4214 | { | |||
4215 | f->previous_length = 0; | |||
4216 | f->page_crc_tests = 0; | |||
4217 | f->discard_samples_deferred = 0; | |||
4218 | f->current_loc_valid = FALSE0; | |||
4219 | f->first_decode = FALSE0; | |||
4220 | f->samples_output = 0; | |||
4221 | f->channel_buffer_start = 0; | |||
4222 | f->channel_buffer_end = 0; | |||
4223 | } | |||
4224 | ||||
4225 | static int vorbis_search_for_page_pushdata(vorb *f, uint8 *data, int data_len) | |||
4226 | { | |||
4227 | int i,n; | |||
4228 | for (i=0; i < f->page_crc_tests; ++i) | |||
4229 | f->scan[i].bytes_done = 0; | |||
4230 | ||||
4231 | // if we have room for more scans, search for them first, because | |||
4232 | // they may cause us to stop early if their header is incomplete | |||
4233 | if (f->page_crc_tests < STB_VORBIS_PUSHDATA_CRC_COUNT4) { | |||
4234 | if (data_len < 4) return 0; | |||
4235 | data_len -= 3; // need to look for 4-byte sequence, so don't miss | |||
4236 | // one that straddles a boundary | |||
4237 | for (i=0; i < data_len; ++i) { | |||
4238 | if (data[i] == 0x4f) { | |||
4239 | if (0==memcmp(data+i, ogg_page_header, 4)) { | |||
4240 | int j,len; | |||
4241 | uint32 crc; | |||
4242 | // make sure we have the whole page header | |||
4243 | if (i+26 >= data_len || i+27+data[i+26] >= data_len) { | |||
4244 | // only read up to this page start, so hopefully we'll | |||
4245 | // have the whole page header start next time | |||
4246 | data_len = i; | |||
4247 | break; | |||
4248 | } | |||
4249 | // ok, we have it all; compute the length of the page | |||
4250 | len = 27 + data[i+26]; | |||
4251 | for (j=0; j < data[i+26]; ++j) | |||
4252 | len += data[i+27+j]; | |||
4253 | // scan everything up to the embedded crc (which we must 0) | |||
4254 | crc = 0; | |||
4255 | for (j=0; j < 22; ++j) | |||
4256 | crc = crc32_update(crc, data[i+j]); | |||
4257 | // now process 4 0-bytes | |||
4258 | for ( ; j < 26; ++j) | |||
4259 | crc = crc32_update(crc, 0); | |||
4260 | // len is the total number of bytes we need to scan | |||
4261 | n = f->page_crc_tests++; | |||
4262 | f->scan[n].bytes_left = len-j; | |||
4263 | f->scan[n].crc_so_far = crc; | |||
4264 | f->scan[n].goal_crc = data[i+22] + (data[i+23] << 8) + (data[i+24]<<16) + (data[i+25]<<24); | |||
4265 | // if the last frame on a page is continued to the next, then | |||
4266 | // we can't recover the sample_loc immediately | |||
4267 | if (data[i+27+data[i+26]-1] == 255) | |||
4268 | f->scan[n].sample_loc = ~0; | |||
4269 | else | |||
4270 | f->scan[n].sample_loc = data[i+6] + (data[i+7] << 8) + (data[i+ 8]<<16) + (data[i+ 9]<<24); | |||
4271 | f->scan[n].bytes_done = i+j; | |||
4272 | if (f->page_crc_tests == STB_VORBIS_PUSHDATA_CRC_COUNT4) | |||
4273 | break; | |||
4274 | // keep going if we still have room for more | |||
4275 | } | |||
4276 | } | |||
4277 | } | |||
4278 | } | |||
4279 | ||||
4280 | for (i=0; i < f->page_crc_tests;) { | |||
4281 | uint32 crc; | |||
4282 | int j; | |||
4283 | int n = f->scan[i].bytes_done; | |||
4284 | int m = f->scan[i].bytes_left; | |||
4285 | if (m > data_len - n) m = data_len - n; | |||
4286 | // m is the bytes to scan in the current chunk | |||
4287 | crc = f->scan[i].crc_so_far; | |||
4288 | for (j=0; j < m; ++j) | |||
4289 | crc = crc32_update(crc, data[n+j]); | |||
4290 | f->scan[i].bytes_left -= m; | |||
4291 | f->scan[i].crc_so_far = crc; | |||
4292 | if (f->scan[i].bytes_left == 0) { | |||
4293 | // does it match? | |||
4294 | if (f->scan[i].crc_so_far == f->scan[i].goal_crc) { | |||
4295 | // Houston, we have page | |||
4296 | data_len = n+m; // consumption amount is wherever that scan ended | |||
4297 | f->page_crc_tests = -1; // drop out of page scan mode | |||
4298 | f->previous_length = 0; // decode-but-don't-output one frame | |||
4299 | f->next_seg = -1; // start a new page | |||
4300 | f->current_loc = f->scan[i].sample_loc; // set the current sample location | |||
4301 | // to the amount we'd have decoded had we decoded this page | |||
4302 | f->current_loc_valid = f->current_loc != ~0; | |||
4303 | return data_len; | |||
4304 | } | |||
4305 | // delete entry | |||
4306 | f->scan[i] = f->scan[--f->page_crc_tests]; | |||
4307 | } else { | |||
4308 | ++i; | |||
4309 | } | |||
4310 | } | |||
4311 | ||||
4312 | return data_len; | |||
4313 | } | |||
4314 | ||||
4315 | // return value: number of bytes we used | |||
4316 | int stb_vorbis_decode_frame_pushdata( | |||
4317 | stb_vorbis *f, // the file we're decoding | |||
4318 | uint8 *data, int data_len, // the memory available for decoding | |||
4319 | int *channels, // place to write number of float * buffers | |||
4320 | float ***output, // place to write float ** array of float * buffers | |||
4321 | int *samples // place to write number of output samples | |||
4322 | ) | |||
4323 | { | |||
4324 | int i; | |||
4325 | int len,right,left; | |||
4326 | ||||
4327 | if (!IS_PUSH_MODE(f)((f)->push_mode)) return error(f, VORBIS_invalid_api_mixing); | |||
4328 | ||||
4329 | if (f->page_crc_tests >= 0) { | |||
4330 | *samples = 0; | |||
4331 | return vorbis_search_for_page_pushdata(f, data, data_len); | |||
4332 | } | |||
4333 | ||||
4334 | f->stream = data; | |||
4335 | f->stream_end = data + data_len; | |||
4336 | f->error = VORBIS__no_error; | |||
4337 | ||||
4338 | // check that we have the entire packet in memory | |||
4339 | if (!is_whole_packet_present(f, FALSE0)) { | |||
4340 | *samples = 0; | |||
4341 | return 0; | |||
4342 | } | |||
4343 | ||||
4344 | if (!vorbis_decode_packet(f, &len, &left, &right)) { | |||
4345 | // save the actual error we encountered | |||
4346 | enum STBVorbisError error = f->error; | |||
4347 | if (error == VORBIS_bad_packet_type) { | |||
4348 | // flush and resynch | |||
4349 | f->error = VORBIS__no_error; | |||
4350 | while (get8_packet(f) != EOP(-1)) | |||
4351 | if (f->eof) break; | |||
4352 | *samples = 0; | |||
4353 | return f->stream - data; | |||
4354 | } | |||
4355 | if (error == VORBIS_continued_packet_flag_invalid) { | |||
4356 | if (f->previous_length == 0) { | |||
4357 | // we may be resynching, in which case it's ok to hit one | |||
4358 | // of these; just discard the packet | |||
4359 | f->error = VORBIS__no_error; | |||
4360 | while (get8_packet(f) != EOP(-1)) | |||
4361 | if (f->eof) break; | |||
4362 | *samples = 0; | |||
4363 | return f->stream - data; | |||
4364 | } | |||
4365 | } | |||
4366 | // if we get an error while parsing, what to do? | |||
4367 | // well, it DEFINITELY won't work to continue from where we are! | |||
4368 | stb_vorbis_flush_pushdata(f); | |||
4369 | // restore the error that actually made us bail | |||
4370 | f->error = error; | |||
4371 | *samples = 0; | |||
4372 | return 1; | |||
4373 | } | |||
4374 | ||||
4375 | // success! | |||
4376 | len = vorbis_finish_frame(f, len, left, right); | |||
4377 | for (i=0; i < f->channels; ++i) | |||
4378 | f->outputs[i] = f->channel_buffers[i] + left; | |||
4379 | ||||
4380 | if (channels) *channels = f->channels; | |||
4381 | *samples = len; | |||
4382 | *output = f->outputs; | |||
4383 | return f->stream - data; | |||
4384 | } | |||
4385 | ||||
4386 | stb_vorbis *stb_vorbis_open_pushdata( | |||
4387 | unsigned char *data, int data_len, // the memory available for decoding | |||
4388 | int *data_used, // only defined if result is not NULL | |||
4389 | int *error, stb_vorbis_alloc *alloc) | |||
4390 | { | |||
4391 | stb_vorbis *f, p; | |||
4392 | vorbis_init(&p, alloc); | |||
4393 | p.stream = data; | |||
4394 | p.stream_end = data + data_len; | |||
4395 | p.push_mode = TRUE1; | |||
4396 | if (!start_decoder(&p)) { | |||
4397 | if (p.eof) | |||
4398 | *error = VORBIS_need_more_data; | |||
4399 | else | |||
4400 | *error = p.error; | |||
4401 | return NULL((void*)0); | |||
4402 | } | |||
4403 | f = vorbis_alloc(&p); | |||
4404 | if (f) { | |||
4405 | *f = p; | |||
4406 | *data_used = f->stream - data; | |||
4407 | *error = 0; | |||
4408 | return f; | |||
4409 | } else { | |||
4410 | vorbis_deinit(&p); | |||
4411 | return NULL((void*)0); | |||
4412 | } | |||
4413 | } | |||
4414 | #endif // STB_VORBIS_NO_PUSHDATA_API | |||
4415 | ||||
4416 | unsigned int stb_vorbis_get_file_offset(stb_vorbis *f) | |||
4417 | { | |||
4418 | #ifndef STB_VORBIS_NO_PUSHDATA_API | |||
4419 | if (f->push_mode) return 0; | |||
4420 | #endif | |||
4421 | if (USE_MEMORY(f)((f)->stream)) return f->stream - f->stream_start; | |||
4422 | #ifndef STB_VORBIS_NO_STDIO | |||
4423 | return ftell(f->f) - f->f_start; | |||
4424 | #endif | |||
4425 | } | |||
4426 | ||||
4427 | #ifndef STB_VORBIS_NO_PULLDATA_API | |||
4428 | // | |||
4429 | // DATA-PULLING API | |||
4430 | // | |||
4431 | ||||
4432 | static uint32 vorbis_find_page(stb_vorbis *f, uint32 *end, uint32 *last) | |||
4433 | { | |||
4434 | for(;;) { | |||
4435 | int n; | |||
4436 | if (f->eof) return 0; | |||
4437 | n = get8(f); | |||
4438 | if (n == 0x4f) { // page header | |||
4439 | unsigned int retry_loc = stb_vorbis_get_file_offset(f); | |||
4440 | int i; | |||
4441 | // check if we're off the end of a file_section stream | |||
4442 | if (retry_loc - 25 > f->stream_len) | |||
4443 | return 0; | |||
4444 | // check the rest of the header | |||
4445 | for (i=1; i < 4; ++i) | |||
4446 | if (get8(f) != ogg_page_header[i]) | |||
4447 | break; | |||
4448 | if (f->eof) return 0; | |||
4449 | if (i == 4) { | |||
4450 | uint8 header[27]; | |||
4451 | uint32 i, crc, goal, len; | |||
4452 | for (i=0; i < 4; ++i) | |||
4453 | header[i] = ogg_page_header[i]; | |||
4454 | for (; i < 27; ++i) | |||
4455 | header[i] = get8(f); | |||
4456 | if (f->eof) return 0; | |||
4457 | if (header[4] != 0) goto invalid; | |||
4458 | goal = header[22] + (header[23] << 8) + (header[24]<<16) + (header[25]<<24); | |||
4459 | for (i=22; i < 26; ++i) | |||
4460 | header[i] = 0; | |||
4461 | crc = 0; | |||
4462 | for (i=0; i < 27; ++i) | |||
4463 | crc = crc32_update(crc, header[i]); | |||
4464 | len = 0; | |||
4465 | for (i=0; i < header[26]; ++i) { | |||
4466 | int s = get8(f); | |||
4467 | crc = crc32_update(crc, s); | |||
4468 | len += s; | |||
4469 | } | |||
4470 | if (len && f->eof) return 0; | |||
4471 | for (i=0; i < len; ++i) | |||
4472 | crc = crc32_update(crc, get8(f)); | |||
4473 | // finished parsing probable page | |||
4474 | if (crc == goal) { | |||
4475 | // we could now check that it's either got the last | |||
4476 | // page flag set, OR it's followed by the capture | |||
4477 | // pattern, but I guess TECHNICALLY you could have | |||
4478 | // a file with garbage between each ogg page and recover | |||
4479 | // from it automatically? So even though that paranoia | |||
4480 | // might decrease the chance of an invalid decode by | |||
4481 | // another 2^32, not worth it since it would hose those | |||
4482 | // invalid-but-useful files? | |||
4483 | if (end) | |||
4484 | *end = stb_vorbis_get_file_offset(f); | |||
4485 | if (last) | |||
4486 | { | |||
4487 | if (header[5] & 0x04) | |||
4488 | *last = 1; | |||
4489 | else | |||
4490 | *last = 0; | |||
4491 | } | |||
4492 | set_file_offset(f, retry_loc-1); | |||
4493 | return 1; | |||
4494 | } | |||
4495 | } | |||
4496 | invalid: | |||
4497 | // not a valid page, so rewind and look for next one | |||
4498 | set_file_offset(f, retry_loc); | |||
4499 | } | |||
4500 | } | |||
4501 | } | |||
4502 | ||||
4503 | // seek is implemented with 'interpolation search'--this is like | |||
4504 | // binary search, but we use the data values to estimate the likely | |||
4505 | // location of the data item (plus a bit of a bias so when the | |||
4506 | // estimation is wrong we don't waste overly much time) | |||
4507 | ||||
4508 | #define SAMPLE_unknown0xffffffff 0xffffffff | |||
4509 | ||||
4510 | ||||
4511 | // ogg vorbis, in its insane infinite wisdom, only provides | |||
4512 | // information about the sample at the END of the page. | |||
4513 | // therefore we COULD have the data we need in the current | |||
4514 | // page, and not know it. we could just use the end location | |||
4515 | // as our only knowledge for bounds, seek back, and eventually | |||
4516 | // the binary search finds it. or we can try to be smart and | |||
4517 | // not waste time trying to locate more pages. we try to be | |||
4518 | // smart, since this data is already in memory anyway, so | |||
4519 | // doing needless I/O would be crazy! | |||
4520 | static int vorbis_analyze_page(stb_vorbis *f, ProbedPage *z) | |||
4521 | { | |||
4522 | uint8 header[27], lacing[255]; | |||
4523 | uint8 packet_type[255]; | |||
4524 | int num_packet, packet_start, previous =0; | |||
4525 | (void)previous; | |||
4526 | int i,len; | |||
4527 | uint32 samples; | |||
4528 | ||||
4529 | // record where the page starts | |||
4530 | z->page_start = stb_vorbis_get_file_offset(f); | |||
4531 | ||||
4532 | // parse the header | |||
4533 | getn(f, header, 27); | |||
4534 | assert(header[0] == 'O' && header[1] == 'g' && header[2] == 'g' && header[3] == 'S')((header[0] == 'O' && header[1] == 'g' && header [2] == 'g' && header[3] == 'S') ? (void)0 : _assert("header[0] == 'O' && header[1] == 'g' && header[2] == 'g' && header[3] == 'S'" , "src/siege/internal/stb/stb_vorbis.c", 4534)); | |||
4535 | getn(f, lacing, header[26]); | |||
4536 | ||||
4537 | // determine the length of the payload | |||
4538 | len = 0; | |||
4539 | for (i=0; i < header[26]; ++i) | |||
4540 | len += lacing[i]; | |||
| ||||
4541 | ||||
4542 | // this implies where the page ends | |||
4543 | z->page_end = z->page_start + 27 + header[26] + len; | |||
4544 | ||||
4545 | // read the last-decoded sample out of the data | |||
4546 | z->last_decoded_sample = header[6] + (header[7] << 8) + (header[8] << 16) + (header[9] << 16); | |||
4547 | ||||
4548 | if (header[5] & 4) { | |||
4549 | // if this is the last page, it's not possible to work | |||
4550 | // backwards to figure out the first sample! whoops! fuck. | |||
4551 | z->first_decoded_sample = SAMPLE_unknown0xffffffff; | |||
4552 | set_file_offset(f, z->page_start); | |||
4553 | return 1; | |||
4554 | } | |||
4555 | ||||
4556 | // scan through the frames to determine the sample-count of each one... | |||
4557 | // our goal is the sample # of the first fully-decoded sample on the | |||
4558 | // page, which is the first decoded sample of the 2nd page | |||
4559 | ||||
4560 | num_packet=0; | |||
4561 | ||||
4562 | packet_start = ((header[5] & 1) == 0); | |||
4563 | ||||
4564 | for (i=0; i < header[26]; ++i) { | |||
4565 | if (packet_start) { | |||
4566 | uint8 n,b,m; | |||
4567 | if (lacing[i] == 0) goto bail; // trying to read from zero-length packet | |||
4568 | n = get8(f); | |||
4569 | // if bottom bit is non-zero, we've got corruption | |||
4570 | if (n & 1) goto bail; | |||
4571 | n >>= 1; | |||
4572 | b = ilog(f->mode_count-1); | |||
4573 | m = n >> b; | |||
4574 | n &= (1 << b)-1; | |||
4575 | if (n >= f->mode_count) goto bail; | |||
4576 | if (num_packet == 0 && f->mode_config[n].blockflag) | |||
4577 | previous = (m & 1); | |||
4578 | packet_type[num_packet++] = f->mode_config[n].blockflag; | |||
4579 | skip(f, lacing[i]-1); | |||
4580 | } else | |||
4581 | skip(f, lacing[i]); | |||
4582 | packet_start = (lacing[i] < 255); | |||
4583 | } | |||
4584 | ||||
4585 | // now that we know the sizes of all the pages, we can start determining | |||
4586 | // how much sample data there is. | |||
4587 | ||||
4588 | samples = 0; | |||
4589 | ||||
4590 | // for the last packet, we step by its whole length, because the definition | |||
4591 | // is that we encoded the end sample loc of the 'last packet completed', | |||
4592 | // where 'completed' refers to packets being split, and we are left to guess | |||
4593 | // what 'end sample loc' means. we assume it means ignoring the fact that | |||
4594 | // the last half of the data is useless without windowing against the next | |||
4595 | // packet... (so it's not REALLY complete in that sense) | |||
4596 | if (num_packet > 1) | |||
4597 | samples += f->blocksize[packet_type[num_packet-1]]; | |||
4598 | ||||
4599 | for (i=num_packet-2; i >= 1; --i) { | |||
4600 | // now, for this packet, how many samples do we have that | |||
4601 | // do not overlap the following packet? | |||
4602 | if (packet_type[i] == 1) | |||
4603 | if (packet_type[i+1] == 1) | |||
4604 | samples += f->blocksize_1 >> 1; | |||
4605 | else | |||
4606 | samples += ((f->blocksize_1 - f->blocksize_0) >> 2) + (f->blocksize_0 >> 1); | |||
4607 | else | |||
4608 | samples += f->blocksize_0 >> 1; | |||
4609 | } | |||
4610 | // now, at this point, we've rewound to the very beginning of the | |||
4611 | // _second_ packet. if we entirely discard the first packet after | |||
4612 | // a seek, this will be exactly the right sample number. HOWEVER! | |||
4613 | // we can't as easily compute this number for the LAST page. The | |||
4614 | // only way to get the sample offset of the LAST page is to use | |||
4615 | // the end loc from the previous page. But what that returns us | |||
4616 | // is _exactly_ the place where we get our first non-overlapped | |||
4617 | // sample. (I think. Stupid spec for being ambiguous.) So for | |||
4618 | // consistency it's better to do that here, too. However, that | |||
4619 | // will then require us to NOT discard all of the first frame we | |||
4620 | // decode, in some cases, which means an even weirder frame size | |||
4621 | // and extra code. what a fucking pain. | |||
4622 | ||||
4623 | // we're going to discard the first packet if we | |||
4624 | // start the seek here, so we don't care about it. (we could actually | |||
4625 | // do better; if the first packet is long, and the previous packet | |||
4626 | // is short, there's actually data in the first half of the first | |||
4627 | // packet that doesn't need discarding... but not worth paying the | |||
4628 | // effort of tracking that of that here and in the seeking logic) | |||
4629 | // except crap, if we infer it from the _previous_ packet's end | |||
4630 | // location, we DO need to use that definition... and we HAVE to | |||
4631 | // infer the start loc of the LAST packet from the previous packet's | |||
4632 | // end location. fuck you, ogg vorbis. | |||
4633 | ||||
4634 | z->first_decoded_sample = z->last_decoded_sample - samples; | |||
4635 | ||||
4636 | // restore file state to where we were | |||
4637 | set_file_offset(f, z->page_start); | |||
4638 | return 1; | |||
4639 | ||||
4640 | // restore file state to where we were | |||
4641 | bail: | |||
4642 | set_file_offset(f, z->page_start); | |||
4643 | return 0; | |||
4644 | } | |||
4645 | ||||
4646 | static int vorbis_seek_frame_from_page(stb_vorbis *f, uint32 page_start, uint32 first_sample, uint32 target_sample, int fine) | |||
4647 | { | |||
4648 | int left_start, left_end, right_start, right_end, mode,i; | |||
4649 | int frame=0; | |||
4650 | uint32 frame_start; | |||
4651 | int frames_to_skip, data_to_skip; | |||
4652 | ||||
4653 | // first_sample is the sample # of the first sample that doesn't | |||
4654 | // overlap the previous page... note that this requires us to | |||
4655 | // _partially_ discard the first packet! bleh. | |||
4656 | set_file_offset(f, page_start); | |||
4657 | ||||
4658 | f->next_seg = -1; // force page resync | |||
4659 | ||||
4660 | frame_start = first_sample; | |||
4661 | // frame start is where the previous packet's last decoded sample | |||
4662 | // was, which corresponds to left_end... EXCEPT if the previous | |||
4663 | // packet was long and this packet is short? Probably a bug here. | |||
4664 | ||||
4665 | ||||
4666 | // now, we can start decoding frames... we'll only FAKE decode them, | |||
4667 | // until we find the frame that contains our sample; then we'll rewind, | |||
4668 | // and try again | |||
4669 | for (;;) { | |||
4670 | int start; | |||
4671 | ||||
4672 | if (!vorbis_decode_initial(f, &left_start, &left_end, &right_start, &right_end, &mode)) | |||
4673 | return error(f, VORBIS_seek_failed); | |||
4674 | ||||
4675 | if (frame == 0) | |||
4676 | start = left_end; | |||
4677 | else | |||
4678 | start = left_start; | |||
4679 | ||||
4680 | // the window starts at left_start; the last valid sample we generate | |||
4681 | // before the next frame's window start is right_start-1 | |||
4682 | if (target_sample < frame_start + right_start-start) | |||
4683 | break; | |||
4684 | ||||
4685 | flush_packet(f); | |||
4686 | if (f->eof) | |||
4687 | return error(f, VORBIS_seek_failed); | |||
4688 | ||||
4689 | frame_start += right_start - start; | |||
4690 | ||||
4691 | ++frame; | |||
4692 | } | |||
4693 | ||||
4694 | // ok, at this point, the sample we want is contained in frame #'frame' | |||
4695 | ||||
4696 | // to decode frame #'frame' normally, we have to decode the | |||
4697 | // previous frame first... but if it's the FIRST frame of the page | |||
4698 | // we can't. if it's the first frame, it means it falls in the part | |||
4699 | // of the first frame that doesn't overlap either of the other frames. | |||
4700 | // so, if we have to handle that case for the first frame, we might | |||
4701 | // as well handle it for all of them, so: | |||
4702 | if (target_sample > frame_start + (left_end - left_start)) { | |||
4703 | // so what we want to do is go ahead and just immediately decode | |||
4704 | // this frame, but then make it so the next get_frame_float() uses | |||
4705 | // this already-decoded data? or do we want to go ahead and rewind, | |||
4706 | // and leave a flag saying to skip the first N data? let's do that | |||
4707 | frames_to_skip = frame; // if this is frame #1, skip 1 frame (#0) | |||
4708 | data_to_skip = left_end - left_start; | |||
4709 | } else { | |||
4710 | // otherwise, we want to skip frames 0, 1, 2, ... frame-2 | |||
4711 | // (which means frame-2+1 total frames) then decode frame-1, | |||
4712 | // then leave frame pending | |||
4713 | frames_to_skip = frame - 1; | |||
4714 | assert(frames_to_skip >= 0)((frames_to_skip >= 0) ? (void)0 : _assert("frames_to_skip >= 0" , "src/siege/internal/stb/stb_vorbis.c", 4714)); | |||
4715 | data_to_skip = -1; | |||
4716 | } | |||
4717 | ||||
4718 | set_file_offset(f, page_start); | |||
4719 | f->next_seg = - 1; // force page resync | |||
4720 | ||||
4721 | for (i=0; i < frames_to_skip; ++i) { | |||
4722 | maybe_start_packet(f); | |||
4723 | flush_packet(f); | |||
4724 | } | |||
4725 | ||||
4726 | if (data_to_skip >= 0) { | |||
4727 | int i,j,n = f->blocksize_0 >> 1; | |||
4728 | f->discard_samples_deferred = data_to_skip; | |||
4729 | for (i=0; i < f->channels; ++i) | |||
4730 | for (j=0; j < n; ++j) | |||
4731 | f->previous_window[i][j] = 0; | |||
4732 | f->previous_length = n; | |||
4733 | frame_start += data_to_skip; | |||
4734 | } else { | |||
4735 | f->previous_length = 0; | |||
4736 | vorbis_pump_first_frame(f); | |||
4737 | } | |||
4738 | ||||
4739 | // at this point, the NEXT decoded frame will generate the desired sample | |||
4740 | if (fine) { | |||
4741 | // so if we're doing sample accurate streaming, we want to go ahead and decode it! | |||
4742 | if (target_sample != frame_start) { | |||
4743 | int n; | |||
4744 | stb_vorbis_get_frame_float(f, &n, NULL((void*)0)); | |||
4745 | assert(target_sample > frame_start)((target_sample > frame_start) ? (void)0 : _assert("target_sample > frame_start" , "src/siege/internal/stb/stb_vorbis.c", 4745)); | |||
4746 | assert(f->channel_buffer_start + (int) (target_sample-frame_start) < f->channel_buffer_end)((f->channel_buffer_start + (int) (target_sample-frame_start ) < f->channel_buffer_end) ? (void)0 : _assert("f->channel_buffer_start + (int) (target_sample-frame_start) < f->channel_buffer_end" , "src/siege/internal/stb/stb_vorbis.c", 4746)); | |||
4747 | f->channel_buffer_start += (target_sample - frame_start); | |||
4748 | } | |||
4749 | } | |||
4750 | ||||
4751 | return 0; | |||
4752 | } | |||
4753 | ||||
4754 | static int vorbis_seek_base(stb_vorbis *f, unsigned int sample_number, int fine) | |||
4755 | { | |||
4756 | ProbedPage p[2],q; | |||
4757 | if (IS_PUSH_MODE(f)((f)->push_mode)) return error(f, VORBIS_invalid_api_mixing); | |||
4758 | ||||
4759 | // do we know the location of the last page? | |||
4760 | if (f->p_last.page_start == 0) { | |||
4761 | uint32 z = stb_vorbis_stream_length_in_samples(f); | |||
4762 | if (z == 0) return error(f, VORBIS_cant_find_last_page); | |||
4763 | } | |||
4764 | ||||
4765 | p[0] = f->p_first; | |||
4766 | p[1] = f->p_last; | |||
4767 | ||||
4768 | if (sample_number >= f->p_last.last_decoded_sample) | |||
4769 | sample_number = f->p_last.last_decoded_sample-1; | |||
4770 | ||||
4771 | if (sample_number < f->p_first.last_decoded_sample) { | |||
4772 | vorbis_seek_frame_from_page(f, p[0].page_start, 0, sample_number, fine); | |||
4773 | return 0; | |||
4774 | } else { | |||
4775 | int attempts=0; | |||
4776 | while (p[0].page_end < p[1].page_start) { | |||
4777 | uint32 probe; | |||
4778 | uint32 start_offset, end_offset; | |||
4779 | uint32 start_sample, end_sample; | |||
4780 | ||||
4781 | // copy these into local variables so we can tweak them | |||
4782 | // if any are unknown | |||
4783 | start_offset = p[0].page_end; | |||
4784 | end_offset = p[1].after_previous_page_start; // an address known to seek to page p[1] | |||
4785 | start_sample = p[0].last_decoded_sample; | |||
4786 | end_sample = p[1].last_decoded_sample; | |||
4787 | ||||
4788 | // currently there is no such tweaking logic needed/possible? | |||
4789 | if (start_sample == SAMPLE_unknown0xffffffff || end_sample == SAMPLE_unknown0xffffffff) | |||
4790 | return error(f, VORBIS_seek_failed); | |||
4791 | ||||
4792 | // now we want to lerp between these for the target samples... | |||
4793 | ||||
4794 | // step 1: we need to bias towards the page start... | |||
4795 | if (start_offset + 4000 < end_offset) | |||
4796 | end_offset -= 4000; | |||
4797 | ||||
4798 | // now compute an interpolated search loc | |||
4799 | probe = start_offset + (int) floor((float) (end_offset - start_offset) / (end_sample - start_sample) * (sample_number - start_sample)); | |||
4800 | ||||
4801 | // next we need to bias towards binary search... | |||
4802 | // code is a little wonky to allow for full 32-bit unsigned values | |||
4803 | if (attempts >= 4) { | |||
4804 | uint32 probe2 = start_offset + ((end_offset - start_offset) >> 1); | |||
4805 | if (attempts >= 8) | |||
4806 | probe = probe2; | |||
4807 | else if (probe < probe2) | |||
4808 | probe = probe + ((probe2 - probe) >> 1); | |||
4809 | else | |||
4810 | probe = probe2 + ((probe - probe2) >> 1); | |||
4811 | } | |||
4812 | ++attempts; | |||
4813 | ||||
4814 | set_file_offset(f, probe); | |||
4815 | if (!vorbis_find_page(f, NULL((void*)0), NULL((void*)0))) return error(f, VORBIS_seek_failed); | |||
4816 | if (!vorbis_analyze_page(f, &q)) return error(f, VORBIS_seek_failed); | |||
4817 | q.after_previous_page_start = probe; | |||
4818 | ||||
4819 | // it's possible we've just found the last page again | |||
4820 | if (q.page_start == p[1].page_start) { | |||
4821 | p[1] = q; | |||
4822 | continue; | |||
4823 | } | |||
4824 | ||||
4825 | if (sample_number < q.last_decoded_sample) | |||
4826 | p[1] = q; | |||
4827 | else | |||
4828 | p[0] = q; | |||
4829 | } | |||
4830 | ||||
4831 | if (p[0].last_decoded_sample <= sample_number && sample_number < p[1].last_decoded_sample) { | |||
4832 | vorbis_seek_frame_from_page(f, p[1].page_start, p[0].last_decoded_sample, sample_number, fine); | |||
4833 | return 0; | |||
4834 | } | |||
4835 | return error(f, VORBIS_seek_failed); | |||
4836 | } | |||
4837 | } | |||
4838 | ||||
4839 | int stb_vorbis_seek_frame(stb_vorbis *f, unsigned int sample_number) | |||
4840 | { | |||
4841 | return vorbis_seek_base(f, sample_number, FALSE0); | |||
| ||||
4842 | } | |||
4843 | ||||
4844 | int stb_vorbis_seek(stb_vorbis *f, unsigned int sample_number) | |||
4845 | { | |||
4846 | return vorbis_seek_base(f, sample_number, TRUE1); | |||
4847 | } | |||
4848 | ||||
4849 | void stb_vorbis_seek_start(stb_vorbis *f) | |||
4850 | { | |||
4851 | if (IS_PUSH_MODE(f)((f)->push_mode)) { error(f, VORBIS_invalid_api_mixing); return; } | |||
4852 | set_file_offset(f, f->first_audio_page_offset); | |||
4853 | f->previous_length = 0; | |||
4854 | f->first_decode = TRUE1; | |||
4855 | f->next_seg = -1; | |||
4856 | vorbis_pump_first_frame(f); | |||
4857 | } | |||
4858 | ||||
4859 | unsigned int stb_vorbis_stream_length_in_samples(stb_vorbis *f) | |||
4860 | { | |||
4861 | unsigned int restore_offset, previous_safe; | |||
4862 | unsigned int end, last_page_loc; | |||
4863 | ||||
4864 | if (IS_PUSH_MODE(f)((f)->push_mode)) return error(f, VORBIS_invalid_api_mixing); | |||
4865 | if (!f->total_samples) { | |||
4866 | int last; | |||
4867 | uint32 lo,hi; | |||
4868 | char header[6]; | |||
4869 | ||||
4870 | // first, store the current decode position so we can restore it | |||
4871 | restore_offset = stb_vorbis_get_file_offset(f); | |||
4872 | ||||
4873 | // now we want to seek back 64K from the end (the last page must | |||
4874 | // be at most a little less than 64K, but let's allow a little slop) | |||
4875 | if (f->stream_len >= 65536 && f->stream_len-65536 >= f->first_audio_page_offset) | |||
4876 | previous_safe = f->stream_len - 65536; | |||
4877 | else | |||
4878 | previous_safe = f->first_audio_page_offset; | |||
4879 | ||||
4880 | set_file_offset(f, previous_safe); | |||
4881 | // previous_safe is now our candidate 'earliest known place that seeking | |||
4882 | // to will lead to the final page' | |||
4883 | ||||
4884 | if (!vorbis_find_page(f, &end, (int unsigned *)&last)) { | |||
4885 | // if we can't find a page, we're hosed! | |||
4886 | f->error = VORBIS_cant_find_last_page; | |||
4887 | f->total_samples = 0xffffffff; | |||
4888 | goto done; | |||
4889 | } | |||
4890 | ||||
4891 | // check if there are more pages | |||
4892 | last_page_loc = stb_vorbis_get_file_offset(f); | |||
4893 | ||||
4894 | // stop when the last_page flag is set, not when we reach eof; | |||
4895 | // this allows us to stop short of a 'file_section' end without | |||
4896 | // explicitly checking the length of the section | |||
4897 | while (!last) { | |||
4898 | set_file_offset(f, end); | |||
4899 | if (!vorbis_find_page(f, &end, (int unsigned *)&last)) { | |||
4900 | // the last page we found didn't have the 'last page' flag | |||
4901 | // set. whoops! | |||
4902 | break; | |||
4903 | } | |||
4904 | previous_safe = last_page_loc+1; | |||
4905 | last_page_loc = stb_vorbis_get_file_offset(f); | |||
4906 | } | |||
4907 | ||||
4908 | set_file_offset(f, last_page_loc); | |||
4909 | ||||
4910 | // parse the header | |||
4911 | getn(f, (unsigned char *)header, 6); | |||
4912 | // extract the absolute granule position | |||
4913 | lo = get32(f); | |||
4914 | hi = get32(f); | |||
4915 | if (lo == 0xffffffff && hi == 0xffffffff) { | |||
4916 | f->error = VORBIS_cant_find_last_page; | |||
4917 | f->total_samples = SAMPLE_unknown0xffffffff; | |||
4918 | goto done; | |||
4919 | } | |||
4920 | if (hi) | |||
4921 | lo = 0xfffffffe; // saturate | |||
4922 | f->total_samples = lo; | |||
4923 | ||||
4924 | f->p_last.page_start = last_page_loc; | |||
4925 | f->p_last.page_end = end; | |||
4926 | f->p_last.last_decoded_sample = lo; | |||
4927 | f->p_last.first_decoded_sample = SAMPLE_unknown0xffffffff; | |||
4928 | f->p_last.after_previous_page_start = previous_safe; | |||
4929 | ||||
4930 | done: | |||
4931 | set_file_offset(f, restore_offset); | |||
4932 | } | |||
4933 | return f->total_samples == SAMPLE_unknown0xffffffff ? 0 : f->total_samples; | |||
4934 | } | |||
4935 | ||||
4936 | float stb_vorbis_stream_length_in_seconds(stb_vorbis *f) | |||
4937 | { | |||
4938 | return stb_vorbis_stream_length_in_samples(f) / (float) f->sample_rate; | |||
4939 | } | |||
4940 | ||||
4941 | ||||
4942 | ||||
4943 | int stb_vorbis_get_frame_float(stb_vorbis *f, int *channels, float ***output) | |||
4944 | { | |||
4945 | int len, right,left,i; | |||
4946 | if (IS_PUSH_MODE(f)((f)->push_mode)) return error(f, VORBIS_invalid_api_mixing); | |||
4947 | ||||
4948 | if (!vorbis_decode_packet(f, &len, &left, &right)) { | |||
4949 | f->channel_buffer_start = f->channel_buffer_end = 0; | |||
4950 | return 0; | |||
4951 | } | |||
4952 | ||||
4953 | len = vorbis_finish_frame(f, len, left, right); | |||
4954 | for (i=0; i < f->channels; ++i) | |||
4955 | f->outputs[i] = f->channel_buffers[i] + left; | |||
4956 | ||||
4957 | f->channel_buffer_start = left; | |||
4958 | f->channel_buffer_end = left+len; | |||
4959 | ||||
4960 | if (channels) *channels = f->channels; | |||
4961 | if (output) *output = f->outputs; | |||
4962 | return len; | |||
4963 | } | |||
4964 | ||||
4965 | #ifndef STB_VORBIS_NO_STDIO | |||
4966 | ||||
4967 | stb_vorbis * stb_vorbis_open_file_section(FILE *file, int close_on_free, int *error, stb_vorbis_alloc *alloc, unsigned int length) | |||
4968 | { | |||
4969 | stb_vorbis *f, p; | |||
4970 | vorbis_init(&p, alloc); | |||
4971 | p.f = file; | |||
4972 | p.f_start = ftell(file); | |||
4973 | p.stream_len = length; | |||
4974 | p.close_on_free = close_on_free; | |||
4975 | if (start_decoder(&p)) { | |||
4976 | f = vorbis_alloc(&p); | |||
4977 | if (f) { | |||
4978 | *f = p; | |||
4979 | vorbis_pump_first_frame(f); | |||
4980 | return f; | |||
4981 | } | |||
4982 | } | |||
4983 | if (error) *error = p.error; | |||
4984 | vorbis_deinit(&p); | |||
4985 | return NULL((void*)0); | |||
4986 | } | |||
4987 | ||||
4988 | stb_vorbis * stb_vorbis_open_file(FILE *file, int close_on_free, int *error, stb_vorbis_alloc *alloc) | |||
4989 | { | |||
4990 | unsigned int len, start; | |||
4991 | start = ftell(file); | |||
4992 | fseek(file, 0, SEEK_END2); | |||
4993 | len = ftell(file) - start; | |||
4994 | fseek(file, start, SEEK_SET0); | |||
4995 | return stb_vorbis_open_file_section(file, close_on_free, error, alloc, len); | |||
4996 | } | |||
4997 | ||||
4998 | stb_vorbis * stb_vorbis_open_filename(char *filename, int *error, stb_vorbis_alloc *alloc) | |||
4999 | { | |||
5000 | FILE *f = fopen(filename, "rb"); | |||
5001 | if (f) | |||
5002 | return stb_vorbis_open_file(f, TRUE1, error, alloc); | |||
5003 | if (error) *error = VORBIS_file_open_failure; | |||
5004 | return NULL((void*)0); | |||
5005 | } | |||
5006 | #endif // STB_VORBIS_NO_STDIO | |||
5007 | ||||
5008 | stb_vorbis * stb_vorbis_open_memory(unsigned char *data, int len, int *error, stb_vorbis_alloc *alloc) | |||
5009 | { | |||
5010 | stb_vorbis *f, p; | |||
5011 | if (data == NULL((void*)0)) return NULL((void*)0); | |||
5012 | vorbis_init(&p, alloc); | |||
5013 | p.stream = data; | |||
5014 | p.stream_end = data + len; | |||
5015 | p.stream_start = p.stream; | |||
5016 | p.stream_len = len; | |||
5017 | p.push_mode = FALSE0; | |||
5018 | if (start_decoder(&p)) { | |||
5019 | f = vorbis_alloc(&p); | |||
5020 | if (f) { | |||
5021 | *f = p; | |||
5022 | vorbis_pump_first_frame(f); | |||
5023 | return f; | |||
5024 | } | |||
5025 | } | |||
5026 | if (error) *error = p.error; | |||
5027 | vorbis_deinit(&p); | |||
5028 | return NULL((void*)0); | |||
5029 | } | |||
5030 | ||||
5031 | #ifndef STB_VORBIS_NO_INTEGER_CONVERSION | |||
5032 | #define PLAYBACK_MONO1 1 | |||
5033 | #define PLAYBACK_LEFT2 2 | |||
5034 | #define PLAYBACK_RIGHT4 4 | |||
5035 | ||||
5036 | #define L(2 | 1) (PLAYBACK_LEFT2 | PLAYBACK_MONO1) | |||
5037 | #define C(2 | 4 | 1) (PLAYBACK_LEFT2 | PLAYBACK_RIGHT4 | PLAYBACK_MONO1) | |||
5038 | #define R(4 | 1) (PLAYBACK_RIGHT4 | PLAYBACK_MONO1) | |||
5039 | ||||
5040 | static int8 channel_position[7][6] = | |||
5041 | { | |||
5042 | { 0 }, | |||
5043 | { C(2 | 4 | 1) }, | |||
5044 | { L(2 | 1), R(4 | 1) }, | |||
5045 | { L(2 | 1), C(2 | 4 | 1), R(4 | 1) }, | |||
5046 | { L(2 | 1), R(4 | 1), L(2 | 1), R(4 | 1) }, | |||
5047 | { L(2 | 1), C(2 | 4 | 1), R(4 | 1), L(2 | 1), R(4 | 1) }, | |||
5048 | { L(2 | 1), C(2 | 4 | 1), R(4 | 1), L(2 | 1), R(4 | 1), C(2 | 4 | 1) }, | |||
5049 | }; | |||
5050 | ||||
5051 | ||||
5052 | #ifndef STB_VORBIS_NO_FAST_SCALED_FLOAT | |||
5053 | typedef union { | |||
5054 | float f; | |||
5055 | int i; | |||
5056 | } float_conv; | |||
5057 | typedef char stb_vorbis_float_size_test[sizeof(float)==4 && sizeof(int) == 4]; | |||
5058 | #define FASTDEF(x)float_conv x float_conv x | |||
5059 | // add (1<<23) to convert to int, then divide by 2^SHIFT, then add 0.5/2^SHIFT to round | |||
5060 | #define MAGIC(SHIFT)(1.5f * (1 << (23-SHIFT)) + 0.5f/(1 << SHIFT)) (1.5f * (1 << (23-SHIFT)) + 0.5f/(1 << SHIFT)) | |||
5061 | #define ADDEND(SHIFT)(((150-SHIFT) << 23) + (1 << 22)) (((150-SHIFT) << 23) + (1 << 22)) | |||
5062 | #define FAST_SCALED_FLOAT_TO_INT(temp,x,s)(temp.f = (x) + (1.5f * (1 << (23-s)) + 0.5f/(1 << s)), temp.i - (((150-s) << 23) + (1 << 22))) (temp.f = (x) + MAGIC(s)(1.5f * (1 << (23-s)) + 0.5f/(1 << s)), temp.i - ADDEND(s)(((150-s) << 23) + (1 << 22))) | |||
5063 | #define check_endianness() | |||
5064 | #else | |||
5065 | #define FAST_SCALED_FLOAT_TO_INT(temp,x,s)(temp.f = (x) + (1.5f * (1 << (23-s)) + 0.5f/(1 << s)), temp.i - (((150-s) << 23) + (1 << 22))) ((int) ((x) * (1 << (s)))) | |||
5066 | #define check_endianness() | |||
5067 | #define FASTDEF(x)float_conv x | |||
5068 | #endif | |||
5069 | ||||
5070 | static void copy_samples(short *dest, float *src, int len) | |||
5071 | { | |||
5072 | int i; | |||
5073 | check_endianness(); | |||
5074 | for (i=0; i < len; ++i) { | |||
5075 | FASTDEF(temp)float_conv temp; | |||
5076 | int v = FAST_SCALED_FLOAT_TO_INT(temp, src[i],15)(temp.f = (src[i]) + (1.5f * (1 << (23-15)) + 0.5f/(1 << 15)), temp.i - (((150-15) << 23) + (1 << 22))); | |||
5077 | if ((unsigned int) (v + 32768) > 65535) | |||
5078 | v = v < 0 ? -32768 : 32767; | |||
5079 | dest[i] = v; | |||
5080 | } | |||
5081 | } | |||
5082 | ||||
5083 | static void compute_samples(int mask, short *output, int num_c, float **data, int d_offset, int len) | |||
5084 | { | |||
5085 | #define BUFFER_SIZE32 32 | |||
5086 | float buffer[BUFFER_SIZE32]; | |||
5087 | int i,j,o,n = BUFFER_SIZE32; | |||
5088 | check_endianness(); | |||
5089 | for (o = 0; o < len; o += BUFFER_SIZE32) { | |||
5090 | memset(buffer, 0, sizeof(buffer)); | |||
5091 | if (o + n > len) n = len - o; | |||
5092 | for (j=0; j < num_c; ++j) { | |||
5093 | if (channel_position[num_c][j] & mask) { | |||
5094 | for (i=0; i < n; ++i) | |||
5095 | buffer[i] += data[j][d_offset+o+i]; | |||
5096 | } | |||
5097 | } | |||
5098 | for (i=0; i < n; ++i) { | |||
5099 | FASTDEF(temp)float_conv temp; | |||
5100 | int v = FAST_SCALED_FLOAT_TO_INT(temp,buffer[i],15)(temp.f = (buffer[i]) + (1.5f * (1 << (23-15)) + 0.5f/( 1 << 15)), temp.i - (((150-15) << 23) + (1 << 22))); | |||
5101 | if ((unsigned int) (v + 32768) > 65535) | |||
5102 | v = v < 0 ? -32768 : 32767; | |||
5103 | output[o+i] = v; | |||
5104 | } | |||
5105 | } | |||
5106 | } | |||
5107 | ||||
5108 | static int channel_selector[3][2] = { {0}, {PLAYBACK_MONO1}, {PLAYBACK_LEFT2, PLAYBACK_RIGHT4} }; | |||
5109 | static void compute_stereo_samples(short *output, int num_c, float **data, int d_offset, int len) | |||
5110 | { | |||
5111 | #define BUFFER_SIZE32 32 | |||
5112 | float buffer[BUFFER_SIZE32]; | |||
5113 | int i,j,o,n = BUFFER_SIZE32 >> 1; | |||
5114 | // o is the offset in the source data | |||
5115 | check_endianness(); | |||
5116 | for (o = 0; o < len; o += BUFFER_SIZE32 >> 1) { | |||
5117 | // o2 is the offset in the output data | |||
5118 | int o2 = o << 1; | |||
5119 | memset(buffer, 0, sizeof(buffer)); | |||
5120 | if (o + n > len) n = len - o; | |||
5121 | for (j=0; j < num_c; ++j) { | |||
5122 | int m = channel_position[num_c][j] & (PLAYBACK_LEFT2 | PLAYBACK_RIGHT4); | |||
5123 | if (m == (PLAYBACK_LEFT2 | PLAYBACK_RIGHT4)) { | |||
5124 | for (i=0; i < n; ++i) { | |||
5125 | buffer[i*2+0] += data[j][d_offset+o+i]; | |||
5126 | buffer[i*2+1] += data[j][d_offset+o+i]; | |||
5127 | } | |||
5128 | } else if (m == PLAYBACK_LEFT2) { | |||
5129 | for (i=0; i < n; ++i) { | |||
5130 | buffer[i*2+0] += data[j][d_offset+o+i]; | |||
5131 | } | |||
5132 | } else if (m == PLAYBACK_RIGHT4) { | |||
5133 | for (i=0; i < n; ++i) { | |||
5134 | buffer[i*2+1] += data[j][d_offset+o+i]; | |||
5135 | } | |||
5136 | } | |||
5137 | } | |||
5138 | for (i=0; i < (n<<1); ++i) { | |||
5139 | FASTDEF(temp)float_conv temp; | |||
5140 | int v = FAST_SCALED_FLOAT_TO_INT(temp,buffer[i],15)(temp.f = (buffer[i]) + (1.5f * (1 << (23-15)) + 0.5f/( 1 << 15)), temp.i - (((150-15) << 23) + (1 << 22))); | |||
5141 | if ((unsigned int) (v + 32768) > 65535) | |||
5142 | v = v < 0 ? -32768 : 32767; | |||
5143 | output[o2+i] = v; | |||
5144 | } | |||
5145 | } | |||
5146 | } | |||
5147 | ||||
5148 | static void convert_samples_short(int buf_c, short **buffer, int b_offset, int data_c, float **data, int d_offset, int samples) | |||
5149 | { | |||
5150 | int i; | |||
5151 | if (buf_c != data_c && buf_c <= 2 && data_c <= 6) { | |||
5152 | static int channel_selector[3][2] = { {0}, {PLAYBACK_MONO1}, {PLAYBACK_LEFT2, PLAYBACK_RIGHT4} }; | |||
5153 | for (i=0; i < buf_c; ++i) | |||
5154 | compute_samples(channel_selector[buf_c][i], buffer[i]+b_offset, data_c, data, d_offset, samples); | |||
5155 | } else { | |||
5156 | int limit = buf_c < data_c ? buf_c : data_c; | |||
5157 | for (i=0; i < limit; ++i) | |||
5158 | copy_samples(buffer[i]+b_offset, data[i], samples); | |||
5159 | for ( ; i < buf_c; ++i) | |||
5160 | memset(buffer[i]+b_offset, 0, sizeof(short) * samples); | |||
5161 | } | |||
5162 | } | |||
5163 | ||||
5164 | int stb_vorbis_get_frame_short(stb_vorbis *f, int num_c, short **buffer, int num_samples) | |||
5165 | { | |||
5166 | float **output; | |||
5167 | int len = stb_vorbis_get_frame_float(f, NULL((void*)0), &output); | |||
5168 | if (len > num_samples) len = num_samples; | |||
5169 | if (len) | |||
5170 | convert_samples_short(num_c, buffer, 0, f->channels, output, 0, len); | |||
5171 | return len; | |||
5172 | } | |||
5173 | ||||
5174 | static void convert_channels_short_interleaved(int buf_c, short *buffer, int data_c, float **data, int d_offset, int len) | |||
5175 | { | |||
5176 | int i; | |||
5177 | check_endianness(); | |||
5178 | if (buf_c != data_c && buf_c <= 2 && data_c <= 6) { | |||
5179 | assert(buf_c == 2)((buf_c == 2) ? (void)0 : _assert("buf_c == 2", "src/siege/internal/stb/stb_vorbis.c" , 5179)); | |||
5180 | for (i=0; i < buf_c; ++i) | |||
5181 | compute_stereo_samples(buffer, data_c, data, d_offset, len); | |||
5182 | } else { | |||
5183 | int limit = buf_c < data_c ? buf_c : data_c; | |||
5184 | int j; | |||
5185 | for (j=0; j < len; ++j) { | |||
5186 | for (i=0; i < limit; ++i) { | |||
5187 | FASTDEF(temp)float_conv temp; | |||
5188 | float f = data[i][d_offset+j]; | |||
5189 | int v = FAST_SCALED_FLOAT_TO_INT(temp, f,15)(temp.f = (f) + (1.5f * (1 << (23-15)) + 0.5f/(1 << 15)), temp.i - (((150-15) << 23) + (1 << 22)));//data[i][d_offset+j],15); | |||
5190 | if ((unsigned int) (v + 32768) > 65535) | |||
5191 | v = v < 0 ? -32768 : 32767; | |||
5192 | *buffer++ = v; | |||
5193 | } | |||
5194 | for ( ; i < buf_c; ++i) | |||
5195 | *buffer++ = 0; | |||
5196 | } | |||
5197 | } | |||
5198 | } | |||
5199 | ||||
5200 | int stb_vorbis_get_frame_short_interleaved(stb_vorbis *f, int num_c, short *buffer, int num_shorts) | |||
5201 | { | |||
5202 | float **output; | |||
5203 | int len; | |||
5204 | if (num_c == 1) return stb_vorbis_get_frame_short(f,num_c,&buffer, num_shorts); | |||
5205 | len = stb_vorbis_get_frame_float(f, NULL((void*)0), &output); | |||
5206 | if (len) { | |||
5207 | if (len*num_c > num_shorts) len = num_shorts / num_c; | |||
5208 | convert_channels_short_interleaved(num_c, buffer, f->channels, output, 0, len); | |||
5209 | } | |||
5210 | return len; | |||
5211 | } | |||
5212 | ||||
5213 | int stb_vorbis_get_samples_short_interleaved(stb_vorbis *f, int channels, short *buffer, int num_shorts) | |||
5214 | { | |||
5215 | float **outputs; | |||
5216 | int len = num_shorts / channels; | |||
5217 | int n=0; | |||
5218 | int z = f->channels; | |||
5219 | if (z > channels) z = channels; | |||
5220 | while (n < len) { | |||
5221 | int k = f->channel_buffer_end - f->channel_buffer_start; | |||
5222 | if (n+k >= len) k = len - n; | |||
5223 | if (k) | |||
5224 | convert_channels_short_interleaved(channels, buffer, f->channels, f->channel_buffers, f->channel_buffer_start, k); | |||
5225 | buffer += k*channels; | |||
5226 | n += k; | |||
5227 | f->channel_buffer_start += k; | |||
5228 | if (n == len) break; | |||
5229 | if (!stb_vorbis_get_frame_float(f, NULL((void*)0), &outputs)) break; | |||
5230 | } | |||
5231 | return n; | |||
5232 | } | |||
5233 | ||||
5234 | int stb_vorbis_get_samples_short(stb_vorbis *f, int channels, short **buffer, int len) | |||
5235 | { | |||
5236 | float **outputs; | |||
5237 | int n=0; | |||
5238 | int z = f->channels; | |||
5239 | if (z > channels) z = channels; | |||
5240 | while (n < len) { | |||
5241 | int k = f->channel_buffer_end - f->channel_buffer_start; | |||
5242 | if (n+k >= len) k = len - n; | |||
5243 | if (k) | |||
5244 | convert_samples_short(channels, buffer, n, f->channels, f->channel_buffers, f->channel_buffer_start, k); | |||
5245 | n += k; | |||
5246 | f->channel_buffer_start += k; | |||
5247 | if (n == len) break; | |||
5248 | if (!stb_vorbis_get_frame_float(f, NULL((void*)0), &outputs)) break; | |||
5249 | } | |||
5250 | return n; | |||
5251 | } | |||
5252 | ||||
5253 | #ifndef STB_VORBIS_NO_STDIO | |||
5254 | int stb_vorbis_decode_filename(char *filename, int *channels, short **output) | |||
5255 | { | |||
5256 | int data_len, offset, total, limit, error; | |||
5257 | short *data; | |||
5258 | stb_vorbis *v = stb_vorbis_open_filename(filename, &error, NULL((void*)0)); | |||
5259 | if (v == NULL((void*)0)) return -1; | |||
5260 | limit = v->channels * 4096; | |||
5261 | *channels = v->channels; | |||
5262 | offset = data_len = 0; | |||
5263 | total = limit; | |||
5264 | data = (short *) malloc(total * sizeof(*data)); | |||
5265 | if (data == NULL((void*)0)) { | |||
5266 | stb_vorbis_close(v); | |||
5267 | return -2; | |||
5268 | } | |||
5269 | for (;;) { | |||
5270 | int n = stb_vorbis_get_frame_short_interleaved(v, v->channels, data+offset, total-offset); | |||
5271 | if (n == 0) break; | |||
5272 | data_len += n; | |||
5273 | offset += n * v->channels; | |||
5274 | if (offset + limit > total) { | |||
5275 | short *data2; | |||
5276 | total *= 2; | |||
5277 | data2 = (short *) realloc(data, total * sizeof(*data)); | |||
5278 | if (data2 == NULL((void*)0)) { | |||
5279 | free(data); | |||
5280 | stb_vorbis_close(v); | |||
5281 | return -2; | |||
5282 | } | |||
5283 | data = data2; | |||
5284 | } | |||
5285 | } | |||
5286 | *output = data; | |||
5287 | return data_len; | |||
5288 | } | |||
5289 | #endif // NO_STDIO | |||
5290 | ||||
5291 | int stb_vorbis_decode_memory(uint8 *mem, int len, int *channels, short **output) | |||
5292 | { | |||
5293 | int data_len, offset, total, limit, error; | |||
5294 | short *data; | |||
5295 | stb_vorbis *v = stb_vorbis_open_memory(mem, len, &error, NULL((void*)0)); | |||
5296 | if (v == NULL((void*)0)) return -1; | |||
5297 | limit = v->channels * 4096; | |||
5298 | *channels = v->channels; | |||
5299 | offset = data_len = 0; | |||
5300 | total = limit; | |||
5301 | data = (short *) malloc(total * sizeof(*data)); | |||
5302 | if (data == NULL((void*)0)) { | |||
5303 | stb_vorbis_close(v); | |||
5304 | return -2; | |||
5305 | } | |||
5306 | for (;;) { | |||
5307 | int n = stb_vorbis_get_frame_short_interleaved(v, v->channels, data+offset, total-offset); | |||
5308 | if (n == 0) break; | |||
5309 | data_len += n; | |||
5310 | offset += n * v->channels; | |||
5311 | if (offset + limit > total) { | |||
5312 | short *data2; | |||
5313 | total *= 2; | |||
5314 | data2 = (short *) realloc(data, total * sizeof(*data)); | |||
5315 | if (data2 == NULL((void*)0)) { | |||
5316 | free(data); | |||
5317 | stb_vorbis_close(v); | |||
5318 | return -2; | |||
5319 | } | |||
5320 | data = data2; | |||
5321 | } | |||
5322 | } | |||
5323 | *output = data; | |||
5324 | return data_len; | |||
5325 | } | |||
5326 | #endif | |||
5327 | ||||
5328 | int stb_vorbis_get_samples_float_interleaved(stb_vorbis *f, int channels, float *buffer, int num_floats) | |||
5329 | { | |||
5330 | float **outputs; | |||
5331 | int len = num_floats / channels; | |||
5332 | int n=0; | |||
5333 | int z = f->channels; | |||
5334 | if (z > channels) z = channels; | |||
5335 | while (n < len) { | |||
5336 | int i,j; | |||
5337 | int k = f->channel_buffer_end - f->channel_buffer_start; | |||
5338 | if (n+k >= len) k = len - n; | |||
5339 | for (j=0; j < k; ++j) { | |||
5340 | for (i=0; i < z; ++i) | |||
5341 | *buffer++ = f->channel_buffers[i][f->channel_buffer_start+j]; | |||
5342 | for ( ; i < channels; ++i) | |||
5343 | *buffer++ = 0; | |||
5344 | } | |||
5345 | n += k; | |||
5346 | f->channel_buffer_start += k; | |||
5347 | if (n == len) break; | |||
5348 | if (!stb_vorbis_get_frame_float(f, NULL((void*)0), &outputs)) break; | |||
5349 | } | |||
5350 | return n; | |||
5351 | } | |||
5352 | ||||
5353 | int stb_vorbis_get_samples_float(stb_vorbis *f, int channels, float **buffer, int num_samples) | |||
5354 | { | |||
5355 | float **outputs; | |||
5356 | int n=0; | |||
5357 | int z = f->channels; | |||
5358 | if (z > channels) z = channels; | |||
5359 | while (n < num_samples) { | |||
5360 | int i; | |||
5361 | int k = f->channel_buffer_end - f->channel_buffer_start; | |||
5362 | if (n+k >= num_samples) k = num_samples - n; | |||
5363 | if (k) { | |||
5364 | for (i=0; i < z; ++i) | |||
5365 | memcpy(buffer[i]+n, f->channel_buffers+f->channel_buffer_start, sizeof(float)*k); | |||
5366 | for ( ; i < channels; ++i) | |||
5367 | memset(buffer[i]+n, 0, sizeof(float) * k); | |||
5368 | } | |||
5369 | n += k; | |||
5370 | f->channel_buffer_start += k; | |||
5371 | if (n == num_samples) break; | |||
5372 | if (!stb_vorbis_get_frame_float(f, NULL((void*)0), &outputs)) break; | |||
5373 | } | |||
5374 | return n; | |||
5375 | } | |||
5376 | #endif // STB_VORBIS_NO_PULLDATA_API | |||
5377 | ||||
5378 | void _dummyFunction(void) | |||
5379 | { | |||
5380 | (void)get_bits_signed; | |||
5381 | (void)codebook_decode_scalar; | |||
5382 | (void)channel_selector; | |||
5383 | } | |||
5384 | ||||
5385 | #endif // STB_VORBIS_HEADER_ONLY |