File: | c:\siege\siege/src/siege/internal/stb/stb_vorbis.c |
Location: | line 5239, column 22 |
Description: | Value stored to 'z' is never read |
1 | // Ogg Vorbis I audio decoder -- version 0.99996 |
2 | // |
3 | // Written in April 2007 by Sean Barrett, sponsored by RAD Game Tools. |
4 | // |
5 | // Placed in the public domain April 2007 by the author: no copyright is |
6 | // claimed, and you may use it for any purpose you like. |
7 | // |
8 | // No warranty for any purpose is expressed or implied by the author (nor |
9 | // by RAD Game Tools). Report bugs and send enhancements to the author. |
10 | // |
11 | // Get the latest version and other information at: |
12 | // http://nothings.org/stb_vorbis/ |
13 | |
14 | |
15 | // Todo: |
16 | // |
17 | // - seeking (note you can seek yourself using the pushdata API) |
18 | // |
19 | // Limitations: |
20 | // |
21 | // - floor 0 not supported (used in old ogg vorbis files) |
22 | // - lossless sample-truncation at beginning ignored |
23 | // - cannot concatenate multiple vorbis streams |
24 | // - sample positions are 32-bit, limiting seekable 192Khz |
25 | // files to around 6 hours (Ogg supports 64-bit) |
26 | // |
27 | // All of these limitations may be removed in future versions. |
28 | |
29 | |
30 | ////////////////////////////////////////////////////////////////////////////// |
31 | // |
32 | // HEADER BEGINS HERE |
33 | // |
34 | |
35 | #ifndef STB_VORBIS_INCLUDE_STB_VORBIS_H |
36 | #define STB_VORBIS_INCLUDE_STB_VORBIS_H |
37 | |
38 | #if defined(STB_VORBIS_NO_CRT) && !defined(STB_VORBIS_NO_STDIO) |
39 | #define STB_VORBIS_NO_STDIO 1 |
40 | #endif |
41 | |
42 | #ifndef STB_VORBIS_NO_STDIO |
43 | #include <stdio.h> |
44 | #endif |
45 | |
46 | #ifdef __cplusplus |
47 | extern "C" { |
48 | #endif |
49 | |
50 | /////////// THREAD SAFETY |
51 | |
52 | // Individual stb_vorbis* handles are not thread-safe; you cannot decode from |
53 | // them from multiple threads at the same time. However, you can have multiple |
54 | // stb_vorbis* handles and decode from them independently in multiple thrads. |
55 | |
56 | |
57 | /////////// MEMORY ALLOCATION |
58 | |
59 | // normally stb_vorbis uses malloc() to allocate memory at startup, |
60 | // and alloca() to allocate temporary memory during a frame on the |
61 | // stack. (Memory consumption will depend on the amount of setup |
62 | // data in the file and how you set the compile flags for speed |
63 | // vs. size. In my test files the maximal-size usage is ~150KB.) |
64 | // |
65 | // You can modify the wrapper functions in the source (setup_malloc, |
66 | // setup_temp_malloc, temp_malloc) to change this behavior, or you |
67 | // can use a simpler allocation model: you pass in a buffer from |
68 | // which stb_vorbis will allocate _all_ its memory (including the |
69 | // temp memory). "open" may fail with a VORBIS_outofmem if you |
70 | // do not pass in enough data; there is no way to determine how |
71 | // much you do need except to succeed (at which point you can |
72 | // query get_info to find the exact amount required. yes I know |
73 | // this is lame). |
74 | // |
75 | // If you pass in a non-NULL buffer of the type below, allocation |
76 | // will occur from it as described above. Otherwise just pass NULL |
77 | // to use malloc()/alloca() |
78 | |
79 | typedef struct |
80 | { |
81 | char *alloc_buffer; |
82 | int alloc_buffer_length_in_bytes; |
83 | } stb_vorbis_alloc; |
84 | |
85 | |
86 | /////////// FUNCTIONS USEABLE WITH ALL INPUT MODES |
87 | |
88 | typedef struct stb_vorbis stb_vorbis; |
89 | |
90 | typedef struct |
91 | { |
92 | unsigned int sample_rate; |
93 | int channels; |
94 | |
95 | unsigned int setup_memory_required; |
96 | unsigned int setup_temp_memory_required; |
97 | unsigned int temp_memory_required; |
98 | |
99 | int max_frame_size; |
100 | } stb_vorbis_info; |
101 | |
102 | // get general information about the file |
103 | extern stb_vorbis_info stb_vorbis_get_info(stb_vorbis *f); |
104 | |
105 | // get the last error detected (clears it, too) |
106 | extern int stb_vorbis_get_error(stb_vorbis *f); |
107 | |
108 | // close an ogg vorbis file and free all memory in use |
109 | extern void stb_vorbis_close(stb_vorbis *f); |
110 | |
111 | // this function returns the offset (in samples) from the beginning of the |
112 | // file that will be returned by the next decode, if it is known, or -1 |
113 | // otherwise. after a flush_pushdata() call, this may take a while before |
114 | // it becomes valid again. |
115 | // NOT WORKING YET after a seek with PULLDATA API |
116 | extern int stb_vorbis_get_sample_offset(stb_vorbis *f); |
117 | |
118 | // returns the current seek point within the file, or offset from the beginning |
119 | // of the memory buffer. In pushdata mode it returns 0. |
120 | extern unsigned int stb_vorbis_get_file_offset(stb_vorbis *f); |
121 | |
122 | /////////// PUSHDATA API |
123 | |
124 | #ifndef STB_VORBIS_NO_PUSHDATA_API |
125 | |
126 | // this API allows you to get blocks of data from any source and hand |
127 | // them to stb_vorbis. you have to buffer them; stb_vorbis will tell |
128 | // you how much it used, and you have to give it the rest next time; |
129 | // and stb_vorbis may not have enough data to work with and you will |
130 | // need to give it the same data again PLUS more. Note that the Vorbis |
131 | // specification does not bound the size of an individual frame. |
132 | |
133 | extern stb_vorbis *stb_vorbis_open_pushdata( |
134 | unsigned char *datablock, int datablock_length_in_bytes, |
135 | int *datablock_memory_consumed_in_bytes, |
136 | int *error, |
137 | stb_vorbis_alloc *alloc_buffer); |
138 | // create a vorbis decoder by passing in the initial data block containing |
139 | // the ogg&vorbis headers (you don't need to do parse them, just provide |
140 | // the first N bytes of the file--you're told if it's not enough, see below) |
141 | // on success, returns an stb_vorbis *, does not set error, returns the amount of |
142 | // data parsed/consumed on this call in *datablock_memory_consumed_in_bytes; |
143 | // on failure, returns NULL on error and sets *error, does not change *datablock_memory_consumed |
144 | // if returns NULL and *error is VORBIS_need_more_data, then the input block was |
145 | // incomplete and you need to pass in a larger block from the start of the file |
146 | |
147 | extern int stb_vorbis_decode_frame_pushdata( |
148 | stb_vorbis *f, unsigned char *datablock, int datablock_length_in_bytes, |
149 | int *channels, // place to write number of float * buffers |
150 | float ***output, // place to write float ** array of float * buffers |
151 | int *samples // place to write number of output samples |
152 | ); |
153 | // decode a frame of audio sample data if possible from the passed-in data block |
154 | // |
155 | // return value: number of bytes we used from datablock |
156 | // possible cases: |
157 | // 0 bytes used, 0 samples output (need more data) |
158 | // N bytes used, 0 samples output (resynching the stream, keep going) |
159 | // N bytes used, M samples output (one frame of data) |
160 | // note that after opening a file, you will ALWAYS get one N-bytes,0-sample |
161 | // frame, because Vorbis always "discards" the first frame. |
162 | // |
163 | // Note that on resynch, stb_vorbis will rarely consume all of the buffer, |
164 | // instead only datablock_length_in_bytes-3 or less. This is because it wants |
165 | // to avoid missing parts of a page header if they cross a datablock boundary, |
166 | // without writing state-machiney code to record a partial detection. |
167 | // |
168 | // The number of channels returned are stored in *channels (which can be |
169 | // NULL--it is always the same as the number of channels reported by |
170 | // get_info). *output will contain an array of float* buffers, one per |
171 | // channel. In other words, (*output)[0][0] contains the first sample from |
172 | // the first channel, and (*output)[1][0] contains the first sample from |
173 | // the second channel. |
174 | |
175 | extern void stb_vorbis_flush_pushdata(stb_vorbis *f); |
176 | // inform stb_vorbis that your next datablock will not be contiguous with |
177 | // previous ones (e.g. you've seeked in the data); future attempts to decode |
178 | // frames will cause stb_vorbis to resynchronize (as noted above), and |
179 | // once it sees a valid Ogg page (typically 4-8KB, as large as 64KB), it |
180 | // will begin decoding the _next_ frame. |
181 | // |
182 | // if you want to seek using pushdata, you need to seek in your file, then |
183 | // call stb_vorbis_flush_pushdata(), then start calling decoding, then once |
184 | // decoding is returning you data, call stb_vorbis_get_sample_offset, and |
185 | // if you don't like the result, seek your file again and repeat. |
186 | #endif |
187 | |
188 | |
189 | ////////// PULLING INPUT API |
190 | |
191 | #ifndef STB_VORBIS_NO_PULLDATA_API |
192 | // This API assumes stb_vorbis is allowed to pull data from a source-- |
193 | // either a block of memory containing the _entire_ vorbis stream, or a |
194 | // FILE * that you or it create, or possibly some other reading mechanism |
195 | // if you go modify the source to replace the FILE * case with some kind |
196 | // of callback to your code. (But if you don't support seeking, you may |
197 | // just want to go ahead and use pushdata.) |
198 | |
199 | #if !defined(STB_VORBIS_NO_STDIO) && !defined(STB_VORBIS_NO_INTEGER_CONVERSION) |
200 | extern int stb_vorbis_decode_filename(char *filename, int *channels, short **output); |
201 | #endif |
202 | extern int stb_vorbis_decode_memory(unsigned char *mem, int len, int *channels, short **output); |
203 | // decode an entire file and output the data interleaved into a malloc()ed |
204 | // buffer stored in *output. The return value is the number of samples |
205 | // decoded, or -1 if the file could not be opened or was not an ogg vorbis file. |
206 | // When you're done with it, just free() the pointer returned in *output. |
207 | |
208 | extern stb_vorbis * stb_vorbis_open_memory(unsigned char *data, int len, |
209 | int *error, stb_vorbis_alloc *alloc_buffer); |
210 | // create an ogg vorbis decoder from an ogg vorbis stream in memory (note |
211 | // this must be the entire stream!). on failure, returns NULL and sets *error |
212 | |
213 | #ifndef STB_VORBIS_NO_STDIO |
214 | extern stb_vorbis * stb_vorbis_open_filename(char *filename, |
215 | int *error, stb_vorbis_alloc *alloc_buffer); |
216 | // create an ogg vorbis decoder from a filename via fopen(). on failure, |
217 | // returns NULL and sets *error (possibly to VORBIS_file_open_failure). |
218 | |
219 | extern stb_vorbis * stb_vorbis_open_file(FILE *f, int close_handle_on_close, |
220 | int *error, stb_vorbis_alloc *alloc_buffer); |
221 | // create an ogg vorbis decoder from an open FILE *, looking for a stream at |
222 | // the _current_ seek point (ftell). on failure, returns NULL and sets *error. |
223 | // note that stb_vorbis must "own" this stream; if you seek it in between |
224 | // calls to stb_vorbis, it will become confused. Morever, if you attempt to |
225 | // perform stb_vorbis_seek_*() operations on this file, it will assume it |
226 | // owns the _entire_ rest of the file after the start point. Use the next |
227 | // function, stb_vorbis_open_file_section(), to limit it. |
228 | |
229 | extern stb_vorbis * stb_vorbis_open_file_section(FILE *f, int close_handle_on_close, |
230 | int *error, stb_vorbis_alloc *alloc_buffer, unsigned int len); |
231 | // create an ogg vorbis decoder from an open FILE *, looking for a stream at |
232 | // the _current_ seek point (ftell); the stream will be of length 'len' bytes. |
233 | // on failure, returns NULL and sets *error. note that stb_vorbis must "own" |
234 | // this stream; if you seek it in between calls to stb_vorbis, it will become |
235 | // confused. |
236 | #endif |
237 | |
238 | extern int stb_vorbis_seek_frame(stb_vorbis *f, unsigned int sample_number); |
239 | extern int stb_vorbis_seek(stb_vorbis *f, unsigned int sample_number); |
240 | // NOT WORKING YET |
241 | // these functions seek in the Vorbis file to (approximately) 'sample_number'. |
242 | // after calling seek_frame(), the next call to get_frame_*() will include |
243 | // the specified sample. after calling stb_vorbis_seek(), the next call to |
244 | // stb_vorbis_get_samples_* will start with the specified sample. If you |
245 | // do not need to seek to EXACTLY the target sample when using get_samples_*, |
246 | // you can also use seek_frame(). |
247 | |
248 | extern void stb_vorbis_seek_start(stb_vorbis *f); |
249 | // this function is equivalent to stb_vorbis_seek(f,0), but it |
250 | // actually works |
251 | |
252 | extern unsigned int stb_vorbis_stream_length_in_samples(stb_vorbis *f); |
253 | extern float stb_vorbis_stream_length_in_seconds(stb_vorbis *f); |
254 | // these functions return the total length of the vorbis stream |
255 | |
256 | extern int stb_vorbis_get_frame_float(stb_vorbis *f, int *channels, float ***output); |
257 | // decode the next frame and return the number of samples. the number of |
258 | // channels returned are stored in *channels (which can be NULL--it is always |
259 | // the same as the number of channels reported by get_info). *output will |
260 | // contain an array of float* buffers, one per channel. These outputs will |
261 | // be overwritten on the next call to stb_vorbis_get_frame_*. |
262 | // |
263 | // You generally should not intermix calls to stb_vorbis_get_frame_*() |
264 | // and stb_vorbis_get_samples_*(), since the latter calls the former. |
265 | |
266 | #ifndef STB_VORBIS_NO_INTEGER_CONVERSION |
267 | extern int stb_vorbis_get_frame_short_interleaved(stb_vorbis *f, int num_c, short *buffer, int num_shorts); |
268 | extern int stb_vorbis_get_frame_short (stb_vorbis *f, int num_c, short **buffer, int num_samples); |
269 | #endif |
270 | // decode the next frame and return the number of samples per channel. the |
271 | // data is coerced to the number of channels you request according to the |
272 | // channel coercion rules (see below). You must pass in the size of your |
273 | // buffer(s) so that stb_vorbis will not overwrite the end of the buffer. |
274 | // The maximum buffer size needed can be gotten from get_info(); however, |
275 | // the Vorbis I specification implies an absolute maximum of 4096 samples |
276 | // per channel. Note that for interleaved data, you pass in the number of |
277 | // shorts (the size of your array), but the return value is the number of |
278 | // samples per channel, not the total number of samples. |
279 | |
280 | // Channel coercion rules: |
281 | // Let M be the number of channels requested, and N the number of channels present, |
282 | // and Cn be the nth channel; let stereo L be the sum of all L and center channels, |
283 | // and stereo R be the sum of all R and center channels (channel assignment from the |
284 | // vorbis spec). |
285 | // M N output |
286 | // 1 k sum(Ck) for all k |
287 | // 2 * stereo L, stereo R |
288 | // k l k > l, the first l channels, then 0s |
289 | // k l k <= l, the first k channels |
290 | // Note that this is not _good_ surround etc. mixing at all! It's just so |
291 | // you get something useful. |
292 | |
293 | extern int stb_vorbis_get_samples_float_interleaved(stb_vorbis *f, int channels, float *buffer, int num_floats); |
294 | extern int stb_vorbis_get_samples_float(stb_vorbis *f, int channels, float **buffer, int num_samples); |
295 | // gets num_samples samples, not necessarily on a frame boundary--this requires |
296 | // buffering so you have to supply the buffers. DOES NOT APPLY THE COERCION RULES. |
297 | // Returns the number of samples stored per channel; it may be less than requested |
298 | // at the end of the file. If there are no more samples in the file, returns 0. |
299 | |
300 | #ifndef STB_VORBIS_NO_INTEGER_CONVERSION |
301 | extern int stb_vorbis_get_samples_short_interleaved(stb_vorbis *f, int channels, short *buffer, int num_shorts); |
302 | extern int stb_vorbis_get_samples_short(stb_vorbis *f, int channels, short **buffer, int num_samples); |
303 | #endif |
304 | // gets num_samples samples, not necessarily on a frame boundary--this requires |
305 | // buffering so you have to supply the buffers. Applies the coercion rules above |
306 | // to produce 'channels' channels. Returns the number of samples stored per channel; |
307 | // it may be less than requested at the end of the file. If there are no more |
308 | // samples in the file, returns 0. |
309 | |
310 | #endif |
311 | |
312 | //////// ERROR CODES |
313 | |
314 | enum STBVorbisError |
315 | { |
316 | VORBIS__no_error, |
317 | |
318 | VORBIS_need_more_data=1, // not a real error |
319 | |
320 | VORBIS_invalid_api_mixing, // can't mix API modes |
321 | VORBIS_outofmem, // not enough memory |
322 | VORBIS_feature_not_supported, // uses floor 0 |
323 | VORBIS_too_many_channels, // STB_VORBIS_MAX_CHANNELS is too small |
324 | VORBIS_file_open_failure, // fopen() failed |
325 | VORBIS_seek_without_length, // can't seek in unknown-length file |
326 | |
327 | VORBIS_unexpected_eof=10, // file is truncated? |
328 | VORBIS_seek_invalid, // seek past EOF |
329 | |
330 | // decoding errors (corrupt/invalid stream) -- you probably |
331 | // don't care about the exact details of these |
332 | |
333 | // vorbis errors: |
334 | VORBIS_invalid_setup=20, |
335 | VORBIS_invalid_stream, |
336 | |
337 | // ogg errors: |
338 | VORBIS_missing_capture_pattern=30, |
339 | VORBIS_invalid_stream_structure_version, |
340 | VORBIS_continued_packet_flag_invalid, |
341 | VORBIS_incorrect_stream_serial_number, |
342 | VORBIS_invalid_first_page, |
343 | VORBIS_bad_packet_type, |
344 | VORBIS_cant_find_last_page, |
345 | VORBIS_seek_failed, |
346 | }; |
347 | |
348 | |
349 | #ifdef __cplusplus |
350 | } |
351 | #endif |
352 | |
353 | #endif // STB_VORBIS_INCLUDE_STB_VORBIS_H |
354 | // |
355 | // HEADER ENDS HERE |
356 | // |
357 | ////////////////////////////////////////////////////////////////////////////// |
358 | |
359 | #ifndef STB_VORBIS_HEADER_ONLY |
360 | |
361 | // global configuration settings (e.g. set these in the project/makefile), |
362 | // or just set them in this file at the top (although ideally the first few |
363 | // should be visible when the header file is compiled too, although it's not |
364 | // crucial) |
365 | |
366 | // STB_VORBIS_NO_PUSHDATA_API |
367 | // does not compile the code for the various stb_vorbis_*_pushdata() |
368 | // functions |
369 | // #define STB_VORBIS_NO_PUSHDATA_API |
370 | |
371 | // STB_VORBIS_NO_PULLDATA_API |
372 | // does not compile the code for the non-pushdata APIs |
373 | // #define STB_VORBIS_NO_PULLDATA_API |
374 | |
375 | // STB_VORBIS_NO_STDIO |
376 | // does not compile the code for the APIs that use FILE *s internally |
377 | // or externally (implied by STB_VORBIS_NO_PULLDATA_API) |
378 | // #define STB_VORBIS_NO_STDIO |
379 | |
380 | // STB_VORBIS_NO_INTEGER_CONVERSION |
381 | // does not compile the code for converting audio sample data from |
382 | // float to integer (implied by STB_VORBIS_NO_PULLDATA_API) |
383 | // #define STB_VORBIS_NO_INTEGER_CONVERSION |
384 | |
385 | // STB_VORBIS_NO_FAST_SCALED_FLOAT |
386 | // does not use a fast float-to-int trick to accelerate float-to-int on |
387 | // most platforms which requires endianness be defined correctly. |
388 | //#define STB_VORBIS_NO_FAST_SCALED_FLOAT |
389 | |
390 | |
391 | // STB_VORBIS_MAX_CHANNELS [number] |
392 | // globally define this to the maximum number of channels you need. |
393 | // The spec does not put a restriction on channels except that |
394 | // the count is stored in a byte, so 255 is the hard limit. |
395 | // Reducing this saves about 16 bytes per value, so using 16 saves |
396 | // (255-16)*16 or around 4KB. Plus anything other memory usage |
397 | // I forgot to account for. Can probably go as low as 8 (7.1 audio), |
398 | // 6 (5.1 audio), or 2 (stereo only). |
399 | #ifndef STB_VORBIS_MAX_CHANNELS16 |
400 | #define STB_VORBIS_MAX_CHANNELS16 16 // enough for anyone? |
401 | #endif |
402 | |
403 | // STB_VORBIS_PUSHDATA_CRC_COUNT [number] |
404 | // after a flush_pushdata(), stb_vorbis begins scanning for the |
405 | // next valid page, without backtracking. when it finds something |
406 | // that looks like a page, it streams through it and verifies its |
407 | // CRC32. Should that validation fail, it keeps scanning. But it's |
408 | // possible that _while_ streaming through to check the CRC32 of |
409 | // one candidate page, it sees another candidate page. This #define |
410 | // determines how many "overlapping" candidate pages it can search |
411 | // at once. Note that "real" pages are typically ~4KB to ~8KB, whereas |
412 | // garbage pages could be as big as 64KB, but probably average ~16KB. |
413 | // So don't hose ourselves by scanning an apparent 64KB page and |
414 | // missing a ton of real ones in the interim; so minimum of 2 |
415 | #ifndef STB_VORBIS_PUSHDATA_CRC_COUNT4 |
416 | #define STB_VORBIS_PUSHDATA_CRC_COUNT4 4 |
417 | #endif |
418 | |
419 | // STB_VORBIS_FAST_HUFFMAN_LENGTH [number] |
420 | // sets the log size of the huffman-acceleration table. Maximum |
421 | // supported value is 24. with larger numbers, more decodings are O(1), |
422 | // but the table size is larger so worse cache missing, so you'll have |
423 | // to probe (and try multiple ogg vorbis files) to find the sweet spot. |
424 | #ifndef STB_VORBIS_FAST_HUFFMAN_LENGTH10 |
425 | #define STB_VORBIS_FAST_HUFFMAN_LENGTH10 10 |
426 | #endif |
427 | |
428 | // STB_VORBIS_FAST_BINARY_LENGTH [number] |
429 | // sets the log size of the binary-search acceleration table. this |
430 | // is used in similar fashion to the fast-huffman size to set initial |
431 | // parameters for the binary search |
432 | |
433 | // STB_VORBIS_FAST_HUFFMAN_INT |
434 | // The fast huffman tables are much more efficient if they can be |
435 | // stored as 16-bit results instead of 32-bit results. This restricts |
436 | // the codebooks to having only 65535 possible outcomes, though. |
437 | // (At least, accelerated by the huffman table.) |
438 | #ifndef STB_VORBIS_FAST_HUFFMAN_INT |
439 | #define STB_VORBIS_FAST_HUFFMAN_SHORT |
440 | #endif |
441 | |
442 | // STB_VORBIS_NO_HUFFMAN_BINARY_SEARCH |
443 | // If the 'fast huffman' search doesn't succeed, then stb_vorbis falls |
444 | // back on binary searching for the correct one. This requires storing |
445 | // extra tables with the huffman codes in sorted order. Defining this |
446 | // symbol trades off space for speed by forcing a linear search in the |
447 | // non-fast case, except for "sparse" codebooks. |
448 | // #define STB_VORBIS_NO_HUFFMAN_BINARY_SEARCH |
449 | |
450 | // STB_VORBIS_DIVIDES_IN_RESIDUE |
451 | // stb_vorbis precomputes the result of the scalar residue decoding |
452 | // that would otherwise require a divide per chunk. you can trade off |
453 | // space for time by defining this symbol. |
454 | // #define STB_VORBIS_DIVIDES_IN_RESIDUE |
455 | |
456 | // STB_VORBIS_DIVIDES_IN_CODEBOOK |
457 | // vorbis VQ codebooks can be encoded two ways: with every case explicitly |
458 | // stored, or with all elements being chosen from a small range of values, |
459 | // and all values possible in all elements. By default, stb_vorbis expands |
460 | // this latter kind out to look like the former kind for ease of decoding, |
461 | // because otherwise an integer divide-per-vector-element is required to |
462 | // unpack the index. If you define STB_VORBIS_DIVIDES_IN_CODEBOOK, you can |
463 | // trade off storage for speed. |
464 | //#define STB_VORBIS_DIVIDES_IN_CODEBOOK |
465 | |
466 | // STB_VORBIS_CODEBOOK_SHORTS |
467 | // The vorbis file format encodes VQ codebook floats as ax+b where a and |
468 | // b are floating point per-codebook constants, and x is a 16-bit int. |
469 | // Normally, stb_vorbis decodes them to floats rather than leaving them |
470 | // as 16-bit ints and computing ax+b while decoding. This is a speed/space |
471 | // tradeoff; you can save space by defining this flag. |
472 | #ifndef STB_VORBIS_CODEBOOK_SHORTS |
473 | #define STB_VORBIS_CODEBOOK_FLOATS |
474 | #endif |
475 | |
476 | // STB_VORBIS_DIVIDE_TABLE |
477 | // this replaces small integer divides in the floor decode loop with |
478 | // table lookups. made less than 1% difference, so disabled by default. |
479 | |
480 | // STB_VORBIS_NO_INLINE_DECODE |
481 | // disables the inlining of the scalar codebook fast-huffman decode. |
482 | // might save a little codespace; useful for debugging |
483 | // #define STB_VORBIS_NO_INLINE_DECODE |
484 | |
485 | // STB_VORBIS_NO_DEFER_FLOOR |
486 | // Normally we only decode the floor without synthesizing the actual |
487 | // full curve. We can instead synthesize the curve immediately. This |
488 | // requires more memory and is very likely slower, so I don't think |
489 | // you'd ever want to do it except for debugging. |
490 | // #define STB_VORBIS_NO_DEFER_FLOOR |
491 | |
492 | |
493 | |
494 | |
495 | ////////////////////////////////////////////////////////////////////////////// |
496 | |
497 | #ifdef STB_VORBIS_NO_PULLDATA_API |
498 | #define STB_VORBIS_NO_INTEGER_CONVERSION |
499 | #define STB_VORBIS_NO_STDIO |
500 | #endif |
501 | |
502 | #if defined(STB_VORBIS_NO_CRT) && !defined(STB_VORBIS_NO_STDIO) |
503 | #define STB_VORBIS_NO_STDIO 1 |
504 | #endif |
505 | |
506 | #ifndef STB_VORBIS_NO_INTEGER_CONVERSION |
507 | #ifndef STB_VORBIS_NO_FAST_SCALED_FLOAT |
508 | |
509 | // only need endianness for fast-float-to-int, which we don't |
510 | // use for pushdata |
511 | |
512 | #ifndef STB_VORBIS_BIG_ENDIAN |
513 | #define STB_VORBIS_ENDIAN0 0 |
514 | #else |
515 | #define STB_VORBIS_ENDIAN0 1 |
516 | #endif |
517 | |
518 | #endif |
519 | #endif |
520 | |
521 | |
522 | #ifndef STB_VORBIS_NO_STDIO |
523 | #include <stdio.h> |
524 | #endif |
525 | |
526 | #ifndef STB_VORBIS_NO_CRT |
527 | #include <stdlib.h> |
528 | #include <string.h> |
529 | #include <assert.h> |
530 | #include <math.h> |
531 | #else |
532 | #define NULL((void*)0) 0 |
533 | #endif |
534 | |
535 | #ifndef _MSC_VER |
536 | #if __GNUC__4 |
537 | #define __forceinlineinline inline |
538 | #else |
539 | #define __forceinlineinline |
540 | #endif |
541 | #endif |
542 | |
543 | #if STB_VORBIS_MAX_CHANNELS16 > 256 |
544 | #error "Value of STB_VORBIS_MAX_CHANNELS outside of allowed range" |
545 | #endif |
546 | |
547 | #if STB_VORBIS_FAST_HUFFMAN_LENGTH10 > 24 |
548 | #error "Value of STB_VORBIS_FAST_HUFFMAN_LENGTH outside of allowed range" |
549 | #endif |
550 | |
551 | |
552 | #define MAX_BLOCKSIZE_LOG13 13 // from specification |
553 | #define MAX_BLOCKSIZE(1 << 13) (1 << MAX_BLOCKSIZE_LOG13) |
554 | |
555 | |
556 | typedef unsigned char uint8; |
557 | typedef signed char int8; |
558 | typedef unsigned short uint16; |
559 | typedef signed short int16; |
560 | typedef unsigned int uint32; |
561 | typedef signed int int32; |
562 | |
563 | #ifndef TRUE1 |
564 | #define TRUE1 1 |
565 | #define FALSE0 0 |
566 | #endif |
567 | |
568 | #ifdef STB_VORBIS_CODEBOOK_FLOATS |
569 | typedef float codetype; |
570 | #else |
571 | typedef uint16 codetype; |
572 | #endif |
573 | |
574 | // @NOTE |
575 | // |
576 | // Some arrays below are tagged "//varies", which means it's actually |
577 | // a variable-sized piece of data, but rather than malloc I assume it's |
578 | // small enough it's better to just allocate it all together with the |
579 | // main thing |
580 | // |
581 | // Most of the variables are specified with the smallest size I could pack |
582 | // them into. It might give better performance to make them all full-sized |
583 | // integers. It should be safe to freely rearrange the structures or change |
584 | // the sizes larger--nothing relies on silently truncating etc., nor the |
585 | // order of variables. |
586 | |
587 | #define FAST_HUFFMAN_TABLE_SIZE(1 << 10) (1 << STB_VORBIS_FAST_HUFFMAN_LENGTH10) |
588 | #define FAST_HUFFMAN_TABLE_MASK((1 << 10) - 1) (FAST_HUFFMAN_TABLE_SIZE(1 << 10) - 1) |
589 | |
590 | typedef struct |
591 | { |
592 | int dimensions, entries; |
593 | uint8 *codeword_lengths; |
594 | float minimum_value; |
595 | float delta_value; |
596 | uint8 value_bits; |
597 | uint8 lookup_type; |
598 | uint8 sequence_p; |
599 | uint8 sparse; |
600 | uint32 lookup_values; |
601 | codetype *multiplicands; |
602 | uint32 *codewords; |
603 | #ifdef STB_VORBIS_FAST_HUFFMAN_SHORT |
604 | int16 fast_huffman[FAST_HUFFMAN_TABLE_SIZE(1 << 10)]; |
605 | #else |
606 | int32 fast_huffman[FAST_HUFFMAN_TABLE_SIZE(1 << 10)]; |
607 | #endif |
608 | uint32 *sorted_codewords; |
609 | int *sorted_values; |
610 | int sorted_entries; |
611 | } Codebook; |
612 | |
613 | typedef struct |
614 | { |
615 | uint8 order; |
616 | uint16 rate; |
617 | uint16 bark_map_size; |
618 | uint8 amplitude_bits; |
619 | uint8 amplitude_offset; |
620 | uint8 number_of_books; |
621 | uint8 book_list[16]; // varies |
622 | } Floor0; |
623 | |
624 | typedef struct |
625 | { |
626 | uint8 partitions; |
627 | uint8 partition_class_list[32]; // varies |
628 | uint8 class_dimensions[16]; // varies |
629 | uint8 class_subclasses[16]; // varies |
630 | uint8 class_masterbooks[16]; // varies |
631 | int16 subclass_books[16][8]; // varies |
632 | uint16 Xlist[31*8+2]; // varies |
633 | uint8 sorted_order[31*8+2]; |
634 | uint8 neighbors[31*8+2][2]; |
635 | uint8 floor1_multiplier; |
636 | uint8 rangebits; |
637 | int values; |
638 | } Floor1; |
639 | |
640 | typedef union |
641 | { |
642 | Floor0 floor0; |
643 | Floor1 floor1; |
644 | } Floor; |
645 | |
646 | typedef struct |
647 | { |
648 | uint32 begin, end; |
649 | uint32 part_size; |
650 | uint8 classifications; |
651 | uint8 classbook; |
652 | uint8 **classdata; |
653 | int16 (*residue_books)[8]; |
654 | } Residue; |
655 | |
656 | typedef struct |
657 | { |
658 | uint8 magnitude; |
659 | uint8 angle; |
660 | uint8 mux; |
661 | } MappingChannel; |
662 | |
663 | typedef struct |
664 | { |
665 | uint16 coupling_steps; |
666 | MappingChannel *chan; |
667 | uint8 submaps; |
668 | uint8 submap_floor[15]; // varies |
669 | uint8 submap_residue[15]; // varies |
670 | } Mapping; |
671 | |
672 | typedef struct |
673 | { |
674 | uint8 blockflag; |
675 | uint8 mapping; |
676 | uint16 windowtype; |
677 | uint16 transformtype; |
678 | } Mode; |
679 | |
680 | typedef struct |
681 | { |
682 | uint32 goal_crc; // expected crc if match |
683 | int bytes_left; // bytes left in packet |
684 | uint32 crc_so_far; // running crc |
685 | int bytes_done; // bytes processed in _current_ chunk |
686 | uint32 sample_loc; // granule pos encoded in page |
687 | } CRCscan; |
688 | |
689 | typedef struct |
690 | { |
691 | uint32 page_start, page_end; |
692 | uint32 after_previous_page_start; |
693 | uint32 first_decoded_sample; |
694 | uint32 last_decoded_sample; |
695 | } ProbedPage; |
696 | |
697 | struct stb_vorbis |
698 | { |
699 | // user-accessible info |
700 | unsigned int sample_rate; |
701 | int channels; |
702 | |
703 | unsigned int setup_memory_required; |
704 | unsigned int temp_memory_required; |
705 | unsigned int setup_temp_memory_required; |
706 | |
707 | // input config |
708 | #ifndef STB_VORBIS_NO_STDIO |
709 | FILE *f; |
710 | uint32 f_start; |
711 | int close_on_free; |
712 | #endif |
713 | |
714 | uint8 *stream; |
715 | uint8 *stream_start; |
716 | uint8 *stream_end; |
717 | |
718 | uint32 stream_len; |
719 | |
720 | uint8 push_mode; |
721 | |
722 | uint32 first_audio_page_offset; |
723 | |
724 | ProbedPage p_first, p_last; |
725 | |
726 | // memory management |
727 | stb_vorbis_alloc alloc; |
728 | int setup_offset; |
729 | int temp_offset; |
730 | |
731 | // run-time results |
732 | int eof; |
733 | enum STBVorbisError error; |
734 | |
735 | // user-useful data |
736 | |
737 | // header info |
738 | int blocksize[2]; |
739 | int blocksize_0, blocksize_1; |
740 | int codebook_count; |
741 | Codebook *codebooks; |
742 | int floor_count; |
743 | uint16 floor_types[64]; // varies |
744 | Floor *floor_config; |
745 | int residue_count; |
746 | uint16 residue_types[64]; // varies |
747 | Residue *residue_config; |
748 | int mapping_count; |
749 | Mapping *mapping; |
750 | int mode_count; |
751 | Mode mode_config[64]; // varies |
752 | |
753 | uint32 total_samples; |
754 | |
755 | // decode buffer |
756 | float *channel_buffers[STB_VORBIS_MAX_CHANNELS16]; |
757 | float *outputs [STB_VORBIS_MAX_CHANNELS16]; |
758 | |
759 | float *previous_window[STB_VORBIS_MAX_CHANNELS16]; |
760 | int previous_length; |
761 | |
762 | #ifndef STB_VORBIS_NO_DEFER_FLOOR |
763 | int16 *finalY[STB_VORBIS_MAX_CHANNELS16]; |
764 | #else |
765 | float *floor_buffers[STB_VORBIS_MAX_CHANNELS16]; |
766 | #endif |
767 | |
768 | uint32 current_loc; // sample location of next frame to decode |
769 | int current_loc_valid; |
770 | |
771 | // per-blocksize precomputed data |
772 | |
773 | // twiddle factors |
774 | float *A[2],*B[2],*C(2 | 4 | 1)[2]; |
775 | float *window[2]; |
776 | uint16 *bit_reverse[2]; |
777 | |
778 | // current page/packet/segment streaming info |
779 | uint32 serial; // stream serial number for verification |
780 | int last_page; |
781 | int segment_count; |
782 | uint8 segments[255]; |
783 | uint8 page_flag; |
784 | uint8 bytes_in_seg; |
785 | uint8 first_decode; |
786 | int next_seg; |
787 | int last_seg; // flag that we're on the last segment |
788 | int last_seg_which; // what was the segment number of the last seg? |
789 | uint32 acc; |
790 | int valid_bits; |
791 | int packet_bytes; |
792 | int end_seg_with_known_loc; |
793 | uint32 known_loc_for_packet; |
794 | int discard_samples_deferred; |
795 | uint32 samples_output; |
796 | |
797 | // push mode scanning |
798 | int page_crc_tests; // only in push_mode: number of tests active; -1 if not searching |
799 | #ifndef STB_VORBIS_NO_PUSHDATA_API |
800 | CRCscan scan[STB_VORBIS_PUSHDATA_CRC_COUNT4]; |
801 | #endif |
802 | |
803 | // sample-access |
804 | int channel_buffer_start; |
805 | int channel_buffer_end; |
806 | }; |
807 | |
808 | extern int my_prof(int slot); |
809 | //#define stb_prof my_prof |
810 | |
811 | #ifndef stb_prof |
812 | #define stb_prof(x)(void)0 (void)0 |
813 | #endif |
814 | |
815 | #if defined(STB_VORBIS_NO_PUSHDATA_API) |
816 | #define IS_PUSH_MODE(f)((f)->push_mode) FALSE0 |
817 | #elif defined(STB_VORBIS_NO_PULLDATA_API) |
818 | #define IS_PUSH_MODE(f)((f)->push_mode) TRUE1 |
819 | #else |
820 | #define IS_PUSH_MODE(f)((f)->push_mode) ((f)->push_mode) |
821 | #endif |
822 | |
823 | typedef struct stb_vorbis vorb; |
824 | |
825 | static int error(vorb *f, enum STBVorbisError e) |
826 | { |
827 | f->error = e; |
828 | if (!f->eof && e != VORBIS_need_more_data) { |
829 | f->error=e; // breakpoint for debugging |
830 | } |
831 | return 0; |
832 | } |
833 | |
834 | |
835 | // these functions are used for allocating temporary memory |
836 | // while decoding. if you can afford the stack space, use |
837 | // alloca(); otherwise, provide a temp buffer and it will |
838 | // allocate out of those. |
839 | |
840 | #define array_size_required(count,size)(count*(sizeof(void *)+(size))) (count*(sizeof(void *)+(size))) |
841 | |
842 | #define temp_alloc(f,size)(f->alloc.alloc_buffer ? setup_temp_malloc(f,size) : alloca (size)) (f->alloc.alloc_buffer ? setup_temp_malloc(f,size) : alloca(size)) |
843 | #ifdef dealloca |
844 | #define temp_free(f,p)0 (f->alloc.alloc_buffer ? 0 : dealloca(size)) |
845 | #else |
846 | #define temp_free(f,p)0 0 |
847 | #endif |
848 | #define temp_alloc_save(f)((f)->temp_offset) ((f)->temp_offset) |
849 | #define temp_alloc_restore(f,p)((f)->temp_offset = (p)) ((f)->temp_offset = (p)) |
850 | |
851 | #define temp_block_array(f,count,size)make_block_array((f->alloc.alloc_buffer ? setup_temp_malloc (f,(count*(sizeof(void *)+(size)))) : alloca((count*(sizeof(void *)+(size))))), count, size) make_block_array(temp_alloc(f,array_size_required(count,size))(f->alloc.alloc_buffer ? setup_temp_malloc(f,(count*(sizeof (void *)+(size)))) : alloca((count*(sizeof(void *)+(size))))), count, size) |
852 | |
853 | // given a sufficiently large block of memory, make an array of pointers to subblocks of it |
854 | static void *make_block_array(void *mem, int count, int size) |
855 | { |
856 | int i; |
857 | void ** p = (void **) mem; |
858 | char *q = (char *) (p + count); |
859 | for (i=0; i < count; ++i) { |
860 | p[i] = q; |
861 | q += size; |
862 | } |
863 | return p; |
864 | } |
865 | |
866 | static void *setup_malloc(vorb *f, int sz) |
867 | { |
868 | sz = (sz+3) & ~3; |
869 | f->setup_memory_required += sz; |
870 | if (f->alloc.alloc_buffer) { |
871 | void *p = (char *) f->alloc.alloc_buffer + f->setup_offset; |
872 | if (f->setup_offset + sz > f->temp_offset) return NULL((void*)0); |
873 | f->setup_offset += sz; |
874 | return p; |
875 | } |
876 | return sz ? malloc(sz) : NULL((void*)0); |
877 | } |
878 | |
879 | static void setup_free(vorb *f, void *p) |
880 | { |
881 | if (f->alloc.alloc_buffer) return; // do nothing; setup mem is not a stack |
882 | free(p); |
883 | } |
884 | |
885 | static void *setup_temp_malloc(vorb *f, int sz) |
886 | { |
887 | sz = (sz+3) & ~3; |
888 | if (f->alloc.alloc_buffer) { |
889 | if (f->temp_offset - sz < f->setup_offset) return NULL((void*)0); |
890 | f->temp_offset -= sz; |
891 | return (char *) f->alloc.alloc_buffer + f->temp_offset; |
892 | } |
893 | return malloc(sz); |
894 | } |
895 | |
896 | static void setup_temp_free(vorb *f, void *p, size_t sz) |
897 | { |
898 | if (f->alloc.alloc_buffer) { |
899 | f->temp_offset += (sz+3)&~3; |
900 | return; |
901 | } |
902 | free(p); |
903 | } |
904 | |
905 | #define CRC32_POLY0x04c11db7 0x04c11db7 // from spec |
906 | |
907 | static uint32 crc_table[256]; |
908 | static void crc32_init(void) |
909 | { |
910 | int i,j; |
911 | uint32 s; |
912 | for(i=0; i < 256; i++) { |
913 | for (s=i<<24, j=0; j < 8; ++j) |
914 | s = (s << 1) ^ (s >= (1<<31) ? CRC32_POLY0x04c11db7 : 0); |
915 | crc_table[i] = s; |
916 | } |
917 | } |
918 | |
919 | static __forceinlineinline uint32 crc32_update(uint32 crc, uint8 byte) |
920 | { |
921 | return (crc << 8) ^ crc_table[byte ^ (crc >> 24)]; |
922 | } |
923 | |
924 | |
925 | // used in setup, and for huffman that doesn't go fast path |
926 | static unsigned int bit_reverse(unsigned int n) |
927 | { |
928 | n = ((n & 0xAAAAAAAA) >> 1) | ((n & 0x55555555) << 1); |
929 | n = ((n & 0xCCCCCCCC) >> 2) | ((n & 0x33333333) << 2); |
930 | n = ((n & 0xF0F0F0F0) >> 4) | ((n & 0x0F0F0F0F) << 4); |
931 | n = ((n & 0xFF00FF00) >> 8) | ((n & 0x00FF00FF) << 8); |
932 | return (n >> 16) | (n << 16); |
933 | } |
934 | |
935 | static float square(float x) |
936 | { |
937 | return x*x; |
938 | } |
939 | |
940 | // this is a weird definition of log2() for which log2(1) = 1, log2(2) = 2, log2(4) = 3 |
941 | // as required by the specification. fast(?) implementation from stb.h |
942 | // @OPTIMIZE: called multiple times per-packet with "constants"; move to setup |
943 | static int ilog(int32 n) |
944 | { |
945 | static signed char log2_4[16] = { 0,1,2,2,3,3,3,3,4,4,4,4,4,4,4,4 }; |
946 | |
947 | // 2 compares if n < 16, 3 compares otherwise (4 if signed or n > 1<<29) |
948 | if (n < (1U << 14)) |
949 | if (n < (1U << 4)) return 0 + log2_4[n ]; |
950 | else if (n < (1U << 9)) return 5 + log2_4[n >> 5]; |
951 | else return 10 + log2_4[n >> 10]; |
952 | else if (n < (1U << 24)) |
953 | if (n < (1U << 19)) return 15 + log2_4[n >> 15]; |
954 | else return 20 + log2_4[n >> 20]; |
955 | else if (n < (1U << 29)) return 25 + log2_4[n >> 25]; |
956 | else if (n < (1U << 31)) return 30 + log2_4[n >> 30]; |
957 | else return 0; // signed n returns 0 |
958 | } |
959 | |
960 | #ifndef M_PI3.14159265358979323846 |
961 | #define M_PI3.14159265358979323846 3.14159265358979323846264f // from CRC |
962 | #endif |
963 | |
964 | // code length assigned to a value with no huffman encoding |
965 | #define NO_CODE255 255 |
966 | |
967 | /////////////////////// LEAF SETUP FUNCTIONS ////////////////////////// |
968 | // |
969 | // these functions are only called at setup, and only a few times |
970 | // per file |
971 | |
972 | static float float32_unpack(uint32 x) |
973 | { |
974 | // from the specification |
975 | uint32 mantissa = x & 0x1fffff; |
976 | uint32 sign = x & 0x80000000; |
977 | uint32 exp = (x & 0x7fe00000) >> 21; |
978 | double res = sign ? -(double)mantissa : (double)mantissa; |
979 | return (float) ldexp((float)res, exp-788); |
980 | } |
981 | |
982 | |
983 | // zlib & jpeg huffman tables assume that the output symbols |
984 | // can either be arbitrarily arranged, or have monotonically |
985 | // increasing frequencies--they rely on the lengths being sorted; |
986 | // this makes for a very simple generation algorithm. |
987 | // vorbis allows a huffman table with non-sorted lengths. This |
988 | // requires a more sophisticated construction, since symbols in |
989 | // order do not map to huffman codes "in order". |
990 | static void add_entry(Codebook *c, uint32 huff_code, int symbol, int count, int len, uint32 *values) |
991 | { |
992 | if (!c->sparse) { |
993 | c->codewords [symbol] = huff_code; |
994 | } else { |
995 | c->codewords [count] = huff_code; |
996 | c->codeword_lengths[count] = len; |
997 | values [count] = symbol; |
998 | } |
999 | } |
1000 | |
1001 | static int compute_codewords(Codebook *c, uint8 *len, int n, uint32 *values) |
1002 | { |
1003 | int i,k,m=0; |
1004 | uint32 available[32]; |
1005 | |
1006 | memset(available, 0, sizeof(available)); |
1007 | // find the first entry |
1008 | for (k=0; k < n; ++k) if (len[k] < NO_CODE255) break; |
1009 | if (k == n) { assert(c->sorted_entries == 0)((c->sorted_entries == 0) ? (void)0 : _assert("c->sorted_entries == 0" , "src/siege/internal/stb/stb_vorbis.c", 1009)); return TRUE1; } |
1010 | // add to the list |
1011 | add_entry(c, 0, k, m++, len[k], values); |
1012 | // add all available leaves |
1013 | for (i=1; i <= len[k]; ++i) |
1014 | available[i] = 1 << (32-i); |
1015 | // note that the above code treats the first case specially, |
1016 | // but it's really the same as the following code, so they |
1017 | // could probably be combined (except the initial code is 0, |
1018 | // and I use 0 in available[] to mean 'empty') |
1019 | for (i=k+1; i < n; ++i) { |
1020 | uint32 res; |
1021 | int z = len[i], y; |
1022 | if (z == NO_CODE255) continue; |
1023 | // find lowest available leaf (should always be earliest, |
1024 | // which is what the specification calls for) |
1025 | // note that this property, and the fact we can never have |
1026 | // more than one free leaf at a given level, isn't totally |
1027 | // trivial to prove, but it seems true and the assert never |
1028 | // fires, so! |
1029 | while (z > 0 && !available[z]) --z; |
1030 | if (z == 0) { assert(0)((0) ? (void)0 : _assert("0", "src/siege/internal/stb/stb_vorbis.c" , 1030)); return FALSE0; } |
1031 | res = available[z]; |
1032 | available[z] = 0; |
1033 | add_entry(c, bit_reverse(res), i, m++, len[i], values); |
1034 | // propogate availability up the tree |
1035 | if (z != len[i]) { |
1036 | for (y=len[i]; y > z; --y) { |
1037 | assert(available[y] == 0)((available[y] == 0) ? (void)0 : _assert("available[y] == 0", "src/siege/internal/stb/stb_vorbis.c", 1037)); |
1038 | available[y] = res + (1 << (32-y)); |
1039 | } |
1040 | } |
1041 | } |
1042 | return TRUE1; |
1043 | } |
1044 | |
1045 | // accelerated huffman table allows fast O(1) match of all symbols |
1046 | // of length <= STB_VORBIS_FAST_HUFFMAN_LENGTH |
1047 | static void compute_accelerated_huffman(Codebook *c) |
1048 | { |
1049 | int i, len; |
1050 | for (i=0; i < FAST_HUFFMAN_TABLE_SIZE(1 << 10); ++i) |
1051 | c->fast_huffman[i] = -1; |
1052 | |
1053 | len = c->sparse ? c->sorted_entries : c->entries; |
1054 | #ifdef STB_VORBIS_FAST_HUFFMAN_SHORT |
1055 | if (len > 32767) len = 32767; // largest possible value we can encode! |
1056 | #endif |
1057 | for (i=0; i < len; ++i) { |
1058 | if (c->codeword_lengths[i] <= STB_VORBIS_FAST_HUFFMAN_LENGTH10) { |
1059 | uint32 z = c->sparse ? bit_reverse(c->sorted_codewords[i]) : c->codewords[i]; |
1060 | // set table entries for all bit combinations in the higher bits |
1061 | while (z < FAST_HUFFMAN_TABLE_SIZE(1 << 10)) { |
1062 | c->fast_huffman[z] = i; |
1063 | z += 1 << c->codeword_lengths[i]; |
1064 | } |
1065 | } |
1066 | } |
1067 | } |
1068 | |
1069 | static int uint32_compare(const void *p, const void *q) |
1070 | { |
1071 | uint32 x = * (uint32 *) p; |
1072 | uint32 y = * (uint32 *) q; |
1073 | return x < y ? -1 : x > y; |
1074 | } |
1075 | |
1076 | static int include_in_sort(Codebook *c, uint8 len) |
1077 | { |
1078 | if (c->sparse) { assert(len != NO_CODE)((len != 255) ? (void)0 : _assert("len != NO_CODE", "src/siege/internal/stb/stb_vorbis.c" , 1078)); return TRUE1; } |
1079 | if (len == NO_CODE255) return FALSE0; |
1080 | if (len > STB_VORBIS_FAST_HUFFMAN_LENGTH10) return TRUE1; |
1081 | return FALSE0; |
1082 | } |
1083 | |
1084 | // if the fast table above doesn't work, we want to binary |
1085 | // search them... need to reverse the bits |
1086 | static void compute_sorted_huffman(Codebook *c, uint8 *lengths, uint32 *values) |
1087 | { |
1088 | int i, len; |
1089 | // build a list of all the entries |
1090 | // OPTIMIZATION: don't include the short ones, since they'll be caught by FAST_HUFFMAN. |
1091 | // this is kind of a frivolous optimization--I don't see any performance improvement, |
1092 | // but it's like 4 extra lines of code, so. |
1093 | if (!c->sparse) { |
1094 | int k = 0; |
1095 | for (i=0; i < c->entries; ++i) |
1096 | if (include_in_sort(c, lengths[i])) |
1097 | c->sorted_codewords[k++] = bit_reverse(c->codewords[i]); |
1098 | assert(k == c->sorted_entries)((k == c->sorted_entries) ? (void)0 : _assert("k == c->sorted_entries" , "src/siege/internal/stb/stb_vorbis.c", 1098)); |
1099 | } else { |
1100 | for (i=0; i < c->sorted_entries; ++i) |
1101 | c->sorted_codewords[i] = bit_reverse(c->codewords[i]); |
1102 | } |
1103 | |
1104 | qsort(c->sorted_codewords, c->sorted_entries, sizeof(c->sorted_codewords[0]), uint32_compare); |
1105 | c->sorted_codewords[c->sorted_entries] = 0xffffffff; |
1106 | |
1107 | len = c->sparse ? c->sorted_entries : c->entries; |
1108 | // now we need to indicate how they correspond; we could either |
1109 | // #1: sort a different data structure that says who they correspond to |
1110 | // #2: for each sorted entry, search the original list to find who corresponds |
1111 | // #3: for each original entry, find the sorted entry |
1112 | // #1 requires extra storage, #2 is slow, #3 can use binary search! |
1113 | for (i=0; i < len; ++i) { |
1114 | int huff_len = c->sparse ? lengths[values[i]] : lengths[i]; |
1115 | if (include_in_sort(c,huff_len)) { |
1116 | uint32 code = bit_reverse(c->codewords[i]); |
1117 | int x=0, n=c->sorted_entries; |
1118 | while (n > 1) { |
1119 | // invariant: sc[x] <= code < sc[x+n] |
1120 | int m = x + (n >> 1); |
1121 | if (c->sorted_codewords[m] <= code) { |
1122 | x = m; |
1123 | n -= (n>>1); |
1124 | } else { |
1125 | n >>= 1; |
1126 | } |
1127 | } |
1128 | assert(c->sorted_codewords[x] == code)((c->sorted_codewords[x] == code) ? (void)0 : _assert("c->sorted_codewords[x] == code" , "src/siege/internal/stb/stb_vorbis.c", 1128)); |
1129 | if (c->sparse) { |
1130 | c->sorted_values[x] = values[i]; |
1131 | c->codeword_lengths[x] = huff_len; |
1132 | } else { |
1133 | c->sorted_values[x] = i; |
1134 | } |
1135 | } |
1136 | } |
1137 | } |
1138 | |
1139 | // only run while parsing the header (3 times) |
1140 | static int vorbis_validate(uint8 *data) |
1141 | { |
1142 | static uint8 vorbis[6] = { 'v', 'o', 'r', 'b', 'i', 's' }; |
1143 | return memcmp(data, vorbis, 6) == 0; |
1144 | } |
1145 | |
1146 | // called from setup only, once per code book |
1147 | // (formula implied by specification) |
1148 | static int lookup1_values(int entries, int dim) |
1149 | { |
1150 | int r = (int) floor(exp((float) log((float) entries) / dim)); |
1151 | if ((int) floor(pow((float) r+1, dim)) <= entries) // (int) cast for MinGW warning; |
1152 | ++r; // floor() to avoid _ftol() when non-CRT |
1153 | assert(pow((float) r+1, dim) > entries)((pow((float) r+1, dim) > entries) ? (void)0 : _assert("pow((float) r+1, dim) > entries" , "src/siege/internal/stb/stb_vorbis.c", 1153)); |
1154 | assert((int) floor(pow((float) r, dim)) <= entries)(((int) floor(pow((float) r, dim)) <= entries) ? (void)0 : _assert("(int) floor(pow((float) r, dim)) <= entries", "src/siege/internal/stb/stb_vorbis.c" , 1154)); // (int),floor() as above |
1155 | return r; |
1156 | } |
1157 | |
1158 | // called twice per file |
1159 | static void compute_twiddle_factors(int n, float *A, float *B, float *C(2 | 4 | 1)) |
1160 | { |
1161 | int n4 = n >> 2, n8 = n >> 3; |
1162 | int k,k2; |
1163 | |
1164 | for (k=k2=0; k < n4; ++k,k2+=2) { |
1165 | A[k2 ] = (float) cos(4*k*M_PI3.14159265358979323846/n); |
1166 | A[k2+1] = (float) -sin(4*k*M_PI3.14159265358979323846/n); |
1167 | B[k2 ] = (float) cos((k2+1)*M_PI3.14159265358979323846/n/2) * 0.5f; |
1168 | B[k2+1] = (float) sin((k2+1)*M_PI3.14159265358979323846/n/2) * 0.5f; |
1169 | } |
1170 | for (k=k2=0; k < n8; ++k,k2+=2) { |
1171 | C(2 | 4 | 1)[k2 ] = (float) cos(2*(k2+1)*M_PI3.14159265358979323846/n); |
1172 | C(2 | 4 | 1)[k2+1] = (float) -sin(2*(k2+1)*M_PI3.14159265358979323846/n); |
1173 | } |
1174 | } |
1175 | |
1176 | static void compute_window(int n, float *window) |
1177 | { |
1178 | int n2 = n >> 1, i; |
1179 | for (i=0; i < n2; ++i) |
1180 | window[i] = (float) sin(0.5 * M_PI3.14159265358979323846 * square((float) sin((i - 0 + 0.5) / n2 * 0.5 * M_PI3.14159265358979323846))); |
1181 | } |
1182 | |
1183 | static void compute_bitreverse(int n, uint16 *rev) |
1184 | { |
1185 | int ld = ilog(n) - 1; // ilog is off-by-one from normal definitions |
1186 | int i, n8 = n >> 3; |
1187 | for (i=0; i < n8; ++i) |
1188 | rev[i] = (bit_reverse(i) >> (32-ld+3)) << 2; |
1189 | } |
1190 | |
1191 | static int init_blocksize(vorb *f, int b, int n) |
1192 | { |
1193 | int n2 = n >> 1, n4 = n >> 2, n8 = n >> 3; |
1194 | f->A[b] = (float *) setup_malloc(f, sizeof(float) * n2); |
1195 | f->B[b] = (float *) setup_malloc(f, sizeof(float) * n2); |
1196 | f->C(2 | 4 | 1)[b] = (float *) setup_malloc(f, sizeof(float) * n4); |
1197 | if (!f->A[b] || !f->B[b] || !f->C(2 | 4 | 1)[b]) return error(f, VORBIS_outofmem); |
1198 | compute_twiddle_factors(n, f->A[b], f->B[b], f->C(2 | 4 | 1)[b]); |
1199 | f->window[b] = (float *) setup_malloc(f, sizeof(float) * n2); |
1200 | if (!f->window[b]) return error(f, VORBIS_outofmem); |
1201 | compute_window(n, f->window[b]); |
1202 | f->bit_reverse[b] = (uint16 *) setup_malloc(f, sizeof(uint16) * n8); |
1203 | if (!f->bit_reverse[b]) return error(f, VORBIS_outofmem); |
1204 | compute_bitreverse(n, f->bit_reverse[b]); |
1205 | return TRUE1; |
1206 | } |
1207 | |
1208 | static void neighbors(uint16 *x, int n, int *plow, int *phigh) |
1209 | { |
1210 | int low = -1; |
1211 | int high = 65536; |
1212 | int i; |
1213 | for (i=0; i < n; ++i) { |
1214 | if (x[i] > low && x[i] < x[n]) { *plow = i; low = x[i]; } |
1215 | if (x[i] < high && x[i] > x[n]) { *phigh = i; high = x[i]; } |
1216 | } |
1217 | } |
1218 | |
1219 | // this has been repurposed so y is now the original index instead of y |
1220 | typedef struct |
1221 | { |
1222 | uint16 x,y; |
1223 | } Point; |
1224 | |
1225 | int point_compare(const void *p, const void *q) |
1226 | { |
1227 | Point *a = (Point *) p; |
1228 | Point *b = (Point *) q; |
1229 | return a->x < b->x ? -1 : a->x > b->x; |
1230 | } |
1231 | |
1232 | // |
1233 | /////////////////////// END LEAF SETUP FUNCTIONS ////////////////////////// |
1234 | |
1235 | |
1236 | #if defined(STB_VORBIS_NO_STDIO) |
1237 | #define USE_MEMORY(z)((z)->stream) TRUE1 |
1238 | #else |
1239 | #define USE_MEMORY(z)((z)->stream) ((z)->stream) |
1240 | #endif |
1241 | |
1242 | static uint8 get8(vorb *z) |
1243 | { |
1244 | if (USE_MEMORY(z)((z)->stream)) { |
1245 | if (z->stream >= z->stream_end) { z->eof = TRUE1; return 0; } |
1246 | return *z->stream++; |
1247 | } |
1248 | |
1249 | #ifndef STB_VORBIS_NO_STDIO |
1250 | { |
1251 | int c = fgetc(z->f); |
1252 | if (c == EOF(-1)) { z->eof = TRUE1; return 0; } |
1253 | return c; |
1254 | } |
1255 | #endif |
1256 | } |
1257 | |
1258 | static uint32 get32(vorb *f) |
1259 | { |
1260 | uint32 x; |
1261 | x = get8(f); |
1262 | x += get8(f) << 8; |
1263 | x += get8(f) << 16; |
1264 | x += get8(f) << 24; |
1265 | return x; |
1266 | } |
1267 | |
1268 | static int getn(vorb *z, uint8 *data, int n) |
1269 | { |
1270 | if (USE_MEMORY(z)((z)->stream)) { |
1271 | if (z->stream+n > z->stream_end) { z->eof = 1; return 0; } |
1272 | memcpy(data, z->stream, n); |
1273 | z->stream += n; |
1274 | return 1; |
1275 | } |
1276 | |
1277 | #ifndef STB_VORBIS_NO_STDIO |
1278 | if (fread(data, n, 1, z->f) == 1) |
1279 | return 1; |
1280 | else { |
1281 | z->eof = 1; |
1282 | return 0; |
1283 | } |
1284 | #endif |
1285 | } |
1286 | |
1287 | static void skip(vorb *z, int n) |
1288 | { |
1289 | if (USE_MEMORY(z)((z)->stream)) { |
1290 | z->stream += n; |
1291 | if (z->stream >= z->stream_end) z->eof = 1; |
1292 | return; |
1293 | } |
1294 | #ifndef STB_VORBIS_NO_STDIO |
1295 | { |
1296 | long x = ftell(z->f); |
1297 | fseek(z->f, x+n, SEEK_SET0); |
1298 | } |
1299 | #endif |
1300 | } |
1301 | |
1302 | static int set_file_offset(stb_vorbis *f, unsigned int loc) |
1303 | { |
1304 | #ifndef STB_VORBIS_NO_PUSHDATA_API |
1305 | if (f->push_mode) return 0; |
1306 | #endif |
1307 | f->eof = 0; |
1308 | if (USE_MEMORY(f)((f)->stream)) { |
1309 | if (f->stream_start + loc >= f->stream_end || f->stream_start + loc < f->stream_start) { |
1310 | f->stream = f->stream_end; |
1311 | f->eof = 1; |
1312 | return 0; |
1313 | } else { |
1314 | f->stream = f->stream_start + loc; |
1315 | return 1; |
1316 | } |
1317 | } |
1318 | #ifndef STB_VORBIS_NO_STDIO |
1319 | if (loc + f->f_start < loc || loc >= 0x80000000) { |
1320 | loc = 0x7fffffff; |
1321 | f->eof = 1; |
1322 | } else { |
1323 | loc += f->f_start; |
1324 | } |
1325 | if (!fseek(f->f, loc, SEEK_SET0)) |
1326 | return 1; |
1327 | f->eof = 1; |
1328 | fseek(f->f, f->f_start, SEEK_END2); |
1329 | return 0; |
1330 | #endif |
1331 | } |
1332 | |
1333 | |
1334 | static uint8 ogg_page_header[4] = { 0x4f, 0x67, 0x67, 0x53 }; |
1335 | |
1336 | static int capture_pattern(vorb *f) |
1337 | { |
1338 | if (0x4f != get8(f)) return FALSE0; |
1339 | if (0x67 != get8(f)) return FALSE0; |
1340 | if (0x67 != get8(f)) return FALSE0; |
1341 | if (0x53 != get8(f)) return FALSE0; |
1342 | return TRUE1; |
1343 | } |
1344 | |
1345 | #define PAGEFLAG_continued_packet1 1 |
1346 | #define PAGEFLAG_first_page2 2 |
1347 | #define PAGEFLAG_last_page4 4 |
1348 | |
1349 | static int start_page_no_capturepattern(vorb *f) |
1350 | { |
1351 | uint32 loc0,loc1,n; |
1352 | int32 i; |
1353 | // stream structure version |
1354 | if (0 != get8(f)) return error(f, VORBIS_invalid_stream_structure_version); |
1355 | // header flag |
1356 | f->page_flag = get8(f); |
1357 | // absolute granule position |
1358 | loc0 = get32(f); |
1359 | loc1 = get32(f); |
1360 | // @TODO: validate loc0,loc1 as valid positions? |
1361 | // stream serial number -- vorbis doesn't interleave, so discard |
1362 | get32(f); |
1363 | //if (f->serial != get32(f)) return error(f, VORBIS_incorrect_stream_serial_number); |
1364 | // page sequence number |
1365 | n = get32(f); |
1366 | f->last_page = n; |
1367 | // CRC32 |
1368 | get32(f); |
1369 | // page_segments |
1370 | f->segment_count = get8(f); |
1371 | if (!getn(f, f->segments, f->segment_count)) |
1372 | return error(f, VORBIS_unexpected_eof); |
1373 | // assume we _don't_ know any the sample position of any segments |
1374 | f->end_seg_with_known_loc = -2; |
1375 | if (loc0 != ~0 || loc1 != ~0) { |
1376 | // determine which packet is the last one that will complete |
1377 | for (i=f->segment_count-1; i >= 0; --i) |
1378 | if (f->segments[i] < 255) |
1379 | break; |
1380 | // 'i' is now the index of the _last_ segment of a packet that ends |
1381 | if (i >= 0) { |
1382 | f->end_seg_with_known_loc = i; |
1383 | f->known_loc_for_packet = loc0; |
1384 | } |
1385 | } |
1386 | if (f->first_decode) { |
1387 | int i,len; |
1388 | ProbedPage p; |
1389 | len = 0; |
1390 | for (i=0; i < f->segment_count; ++i) |
1391 | len += f->segments[i]; |
1392 | len += 27 + f->segment_count; |
1393 | p.page_start = f->first_audio_page_offset; |
1394 | p.page_end = p.page_start + len; |
1395 | p.after_previous_page_start = p.page_start; |
1396 | p.first_decoded_sample = 0; |
1397 | p.last_decoded_sample = loc0; |
1398 | f->p_first = p; |
1399 | } |
1400 | f->next_seg = 0; |
1401 | return TRUE1; |
1402 | } |
1403 | |
1404 | static int start_page(vorb *f) |
1405 | { |
1406 | if (!capture_pattern(f)) return error(f, VORBIS_missing_capture_pattern); |
1407 | return start_page_no_capturepattern(f); |
1408 | } |
1409 | |
1410 | static int start_packet(vorb *f) |
1411 | { |
1412 | while (f->next_seg == -1) { |
1413 | if (!start_page(f)) return FALSE0; |
1414 | if (f->page_flag & PAGEFLAG_continued_packet1) |
1415 | return error(f, VORBIS_continued_packet_flag_invalid); |
1416 | } |
1417 | f->last_seg = FALSE0; |
1418 | f->valid_bits = 0; |
1419 | f->packet_bytes = 0; |
1420 | f->bytes_in_seg = 0; |
1421 | // f->next_seg is now valid |
1422 | return TRUE1; |
1423 | } |
1424 | |
1425 | static int maybe_start_packet(vorb *f) |
1426 | { |
1427 | if (f->next_seg == -1) { |
1428 | int x = get8(f); |
1429 | if (f->eof) return FALSE0; // EOF at page boundary is not an error! |
1430 | if (0x4f != x ) return error(f, VORBIS_missing_capture_pattern); |
1431 | if (0x67 != get8(f)) return error(f, VORBIS_missing_capture_pattern); |
1432 | if (0x67 != get8(f)) return error(f, VORBIS_missing_capture_pattern); |
1433 | if (0x53 != get8(f)) return error(f, VORBIS_missing_capture_pattern); |
1434 | if (!start_page_no_capturepattern(f)) return FALSE0; |
1435 | if (f->page_flag & PAGEFLAG_continued_packet1) { |
1436 | // set up enough state that we can read this packet if we want, |
1437 | // e.g. during recovery |
1438 | f->last_seg = FALSE0; |
1439 | f->bytes_in_seg = 0; |
1440 | return error(f, VORBIS_continued_packet_flag_invalid); |
1441 | } |
1442 | } |
1443 | return start_packet(f); |
1444 | } |
1445 | |
1446 | static int next_segment(vorb *f) |
1447 | { |
1448 | int len; |
1449 | if (f->last_seg) return 0; |
1450 | if (f->next_seg == -1) { |
1451 | f->last_seg_which = f->segment_count-1; // in case start_page fails |
1452 | if (!start_page(f)) { f->last_seg = 1; return 0; } |
1453 | if (!(f->page_flag & PAGEFLAG_continued_packet1)) return error(f, VORBIS_continued_packet_flag_invalid); |
1454 | } |
1455 | len = f->segments[f->next_seg++]; |
1456 | if (len < 255) { |
1457 | f->last_seg = TRUE1; |
1458 | f->last_seg_which = f->next_seg-1; |
1459 | } |
1460 | if (f->next_seg >= f->segment_count) |
1461 | f->next_seg = -1; |
1462 | assert(f->bytes_in_seg == 0)((f->bytes_in_seg == 0) ? (void)0 : _assert("f->bytes_in_seg == 0" , "src/siege/internal/stb/stb_vorbis.c", 1462)); |
1463 | f->bytes_in_seg = len; |
1464 | return len; |
1465 | } |
1466 | |
1467 | #define EOP(-1) (-1) |
1468 | #define INVALID_BITS(-1) (-1) |
1469 | |
1470 | static int get8_packet_raw(vorb *f) |
1471 | { |
1472 | if (!f->bytes_in_seg) |
1473 | { |
1474 | if (f->last_seg) return EOP(-1); |
1475 | else if (!next_segment(f)) return EOP(-1); |
1476 | } |
1477 | assert(f->bytes_in_seg > 0)((f->bytes_in_seg > 0) ? (void)0 : _assert("f->bytes_in_seg > 0" , "src/siege/internal/stb/stb_vorbis.c", 1477)); |
1478 | --f->bytes_in_seg; |
1479 | ++f->packet_bytes; |
1480 | return get8(f); |
1481 | } |
1482 | |
1483 | static int get8_packet(vorb *f) |
1484 | { |
1485 | int x = get8_packet_raw(f); |
1486 | f->valid_bits = 0; |
1487 | return x; |
1488 | } |
1489 | |
1490 | static void flush_packet(vorb *f) |
1491 | { |
1492 | while (get8_packet_raw(f) != EOP(-1)); |
1493 | } |
1494 | |
1495 | // @OPTIMIZE: this is the secondary bit decoder, so it's probably not as important |
1496 | // as the huffman decoder? |
1497 | static uint32 get_bits(vorb *f, int n) |
1498 | { |
1499 | uint32 z; |
1500 | |
1501 | if (f->valid_bits < 0) return 0; |
1502 | if (f->valid_bits < n) { |
1503 | if (n > 24) { |
1504 | // the accumulator technique below would not work correctly in this case |
1505 | z = get_bits(f, 24); |
1506 | z += get_bits(f, n-24) << 24; |
1507 | return z; |
1508 | } |
1509 | if (f->valid_bits == 0) f->acc = 0; |
1510 | while (f->valid_bits < n) { |
1511 | int z = get8_packet_raw(f); |
1512 | if (z == EOP(-1)) { |
1513 | f->valid_bits = INVALID_BITS(-1); |
1514 | return 0; |
1515 | } |
1516 | f->acc += z << f->valid_bits; |
1517 | f->valid_bits += 8; |
1518 | } |
1519 | } |
1520 | if (f->valid_bits < 0) return 0; |
1521 | z = f->acc & ((1 << n)-1); |
1522 | f->acc >>= n; |
1523 | f->valid_bits -= n; |
1524 | return z; |
1525 | } |
1526 | |
1527 | static int32 get_bits_signed(vorb *f, int n) |
1528 | { |
1529 | uint32 z = get_bits(f, n); |
1530 | if (z & (1 << (n-1))) |
1531 | z += ~((1 << n) - 1); |
1532 | return (int32) z; |
1533 | } |
1534 | |
1535 | // @OPTIMIZE: primary accumulator for huffman |
1536 | // expand the buffer to as many bits as possible without reading off end of packet |
1537 | // it might be nice to allow f->valid_bits and f->acc to be stored in registers, |
1538 | // e.g. cache them locally and decode locally |
1539 | static __forceinlineinline void prep_huffman(vorb *f) |
1540 | { |
1541 | if (f->valid_bits <= 24) { |
1542 | if (f->valid_bits == 0) f->acc = 0; |
1543 | do { |
1544 | int z; |
1545 | if (f->last_seg && !f->bytes_in_seg) return; |
1546 | z = get8_packet_raw(f); |
1547 | if (z == EOP(-1)) return; |
1548 | f->acc += z << f->valid_bits; |
1549 | f->valid_bits += 8; |
1550 | } while (f->valid_bits <= 24); |
1551 | } |
1552 | } |
1553 | |
1554 | enum |
1555 | { |
1556 | VORBIS_packet_id = 1, |
1557 | VORBIS_packet_comment = 3, |
1558 | VORBIS_packet_setup = 5, |
1559 | }; |
1560 | |
1561 | static int codebook_decode_scalar_raw(vorb *f, Codebook *c) |
1562 | { |
1563 | int i; |
1564 | prep_huffman(f); |
1565 | |
1566 | assert(c->sorted_codewords || c->codewords)((c->sorted_codewords || c->codewords) ? (void)0 : _assert ("c->sorted_codewords || c->codewords", "src/siege/internal/stb/stb_vorbis.c" , 1566)); |
1567 | // cases to use binary search: sorted_codewords && !c->codewords |
1568 | // sorted_codewords && c->entries > 8 |
1569 | if (c->entries > 8 ? c->sorted_codewords!=NULL((void*)0) : !c->codewords) { |
1570 | // binary search |
1571 | uint32 code = bit_reverse(f->acc); |
1572 | int x=0, n=c->sorted_entries, len; |
1573 | |
1574 | while (n > 1) { |
1575 | // invariant: sc[x] <= code < sc[x+n] |
1576 | int m = x + (n >> 1); |
1577 | if (c->sorted_codewords[m] <= code) { |
1578 | x = m; |
1579 | n -= (n>>1); |
1580 | } else { |
1581 | n >>= 1; |
1582 | } |
1583 | } |
1584 | // x is now the sorted index |
1585 | if (!c->sparse) x = c->sorted_values[x]; |
1586 | // x is now sorted index if sparse, or symbol otherwise |
1587 | len = c->codeword_lengths[x]; |
1588 | if (f->valid_bits >= len) { |
1589 | f->acc >>= len; |
1590 | f->valid_bits -= len; |
1591 | return x; |
1592 | } |
1593 | |
1594 | f->valid_bits = 0; |
1595 | return -1; |
1596 | } |
1597 | |
1598 | // if small, linear search |
1599 | assert(!c->sparse)((!c->sparse) ? (void)0 : _assert("!c->sparse", "src/siege/internal/stb/stb_vorbis.c" , 1599)); |
1600 | for (i=0; i < c->entries; ++i) { |
1601 | if (c->codeword_lengths[i] == NO_CODE255) continue; |
1602 | if (c->codewords[i] == (f->acc & ((1 << c->codeword_lengths[i])-1))) { |
1603 | if (f->valid_bits >= c->codeword_lengths[i]) { |
1604 | f->acc >>= c->codeword_lengths[i]; |
1605 | f->valid_bits -= c->codeword_lengths[i]; |
1606 | return i; |
1607 | } |
1608 | f->valid_bits = 0; |
1609 | return -1; |
1610 | } |
1611 | } |
1612 | |
1613 | error(f, VORBIS_invalid_stream); |
1614 | f->valid_bits = 0; |
1615 | return -1; |
1616 | } |
1617 | |
1618 | static int codebook_decode_scalar(vorb *f, Codebook *c) |
1619 | { |
1620 | int i; |
1621 | if (f->valid_bits < STB_VORBIS_FAST_HUFFMAN_LENGTH10) |
1622 | prep_huffman(f); |
1623 | // fast huffman table lookup |
1624 | i = f->acc & FAST_HUFFMAN_TABLE_MASK((1 << 10) - 1); |
1625 | i = c->fast_huffman[i]; |
1626 | if (i >= 0) { |
1627 | f->acc >>= c->codeword_lengths[i]; |
1628 | f->valid_bits -= c->codeword_lengths[i]; |
1629 | if (f->valid_bits < 0) { f->valid_bits = 0; return -1; } |
1630 | return i; |
1631 | } |
1632 | return codebook_decode_scalar_raw(f,c); |
1633 | } |
1634 | |
1635 | #ifndef STB_VORBIS_NO_INLINE_DECODE |
1636 | |
1637 | #define DECODE_RAW(var, f,c)if (f->valid_bits < 10) prep_huffman(f); var = f->acc & ((1 << 10) - 1); var = c->fast_huffman[var]; if (var >= 0) { int n = c->codeword_lengths[var]; f->acc >>= n; f->valid_bits -= n; if (f->valid_bits < 0) { f->valid_bits = 0; var = -1; } } else { var = codebook_decode_scalar_raw (f,c); } \ |
1638 | if (f->valid_bits < STB_VORBIS_FAST_HUFFMAN_LENGTH10) \ |
1639 | prep_huffman(f); \ |
1640 | var = f->acc & FAST_HUFFMAN_TABLE_MASK((1 << 10) - 1); \ |
1641 | var = c->fast_huffman[var]; \ |
1642 | if (var >= 0) { \ |
1643 | int n = c->codeword_lengths[var]; \ |
1644 | f->acc >>= n; \ |
1645 | f->valid_bits -= n; \ |
1646 | if (f->valid_bits < 0) { f->valid_bits = 0; var = -1; } \ |
1647 | } else { \ |
1648 | var = codebook_decode_scalar_raw(f,c); \ |
1649 | } |
1650 | |
1651 | #else |
1652 | |
1653 | #define DECODE_RAW(var,f,c)if (f->valid_bits < 10) prep_huffman(f); var = f->acc & ((1 << 10) - 1); var = c->fast_huffman[var]; if (var >= 0) { int n = c->codeword_lengths[var]; f->acc >>= n; f->valid_bits -= n; if (f->valid_bits < 0) { f->valid_bits = 0; var = -1; } } else { var = codebook_decode_scalar_raw (f,c); } var = codebook_decode_scalar(f,c); |
1654 | |
1655 | #endif |
1656 | |
1657 | #define DECODE(var,f,c)if (f->valid_bits < 10) prep_huffman(f); var = f->acc & ((1 << 10) - 1); var = c->fast_huffman[var]; if (var >= 0) { int n = c->codeword_lengths[var]; f->acc >>= n; f->valid_bits -= n; if (f->valid_bits < 0) { f->valid_bits = 0; var = -1; } } else { var = codebook_decode_scalar_raw (f,c); } if (c->sparse) var = c->sorted_values[var]; \ |
1658 | DECODE_RAW(var,f,c)if (f->valid_bits < 10) prep_huffman(f); var = f->acc & ((1 << 10) - 1); var = c->fast_huffman[var]; if (var >= 0) { int n = c->codeword_lengths[var]; f->acc >>= n; f->valid_bits -= n; if (f->valid_bits < 0) { f->valid_bits = 0; var = -1; } } else { var = codebook_decode_scalar_raw (f,c); } \ |
1659 | if (c->sparse) var = c->sorted_values[var]; |
1660 | |
1661 | #ifndef STB_VORBIS_DIVIDES_IN_CODEBOOK |
1662 | #define DECODE_VQ(var,f,c)if (f->valid_bits < 10) prep_huffman(f); var = f->acc & ((1 << 10) - 1); var = c->fast_huffman[var]; if (var >= 0) { int n = c->codeword_lengths[var]; f->acc >>= n; f->valid_bits -= n; if (f->valid_bits < 0) { f->valid_bits = 0; var = -1; } } else { var = codebook_decode_scalar_raw (f,c); } DECODE_RAW(var,f,c)if (f->valid_bits < 10) prep_huffman(f); var = f->acc & ((1 << 10) - 1); var = c->fast_huffman[var]; if (var >= 0) { int n = c->codeword_lengths[var]; f->acc >>= n; f->valid_bits -= n; if (f->valid_bits < 0) { f->valid_bits = 0; var = -1; } } else { var = codebook_decode_scalar_raw (f,c); } |
1663 | #else |
1664 | #define DECODE_VQ(var,f,c)if (f->valid_bits < 10) prep_huffman(f); var = f->acc & ((1 << 10) - 1); var = c->fast_huffman[var]; if (var >= 0) { int n = c->codeword_lengths[var]; f->acc >>= n; f->valid_bits -= n; if (f->valid_bits < 0) { f->valid_bits = 0; var = -1; } } else { var = codebook_decode_scalar_raw (f,c); } DECODE(var,f,c)if (f->valid_bits < 10) prep_huffman(f); var = f->acc & ((1 << 10) - 1); var = c->fast_huffman[var]; if (var >= 0) { int n = c->codeword_lengths[var]; f->acc >>= n; f->valid_bits -= n; if (f->valid_bits < 0) { f->valid_bits = 0; var = -1; } } else { var = codebook_decode_scalar_raw (f,c); } if (c->sparse) var = c->sorted_values[var]; |
1665 | #endif |
1666 | |
1667 | |
1668 | |
1669 | |
1670 | |
1671 | |
1672 | // CODEBOOK_ELEMENT_FAST is an optimization for the CODEBOOK_FLOATS case |
1673 | // where we avoid one addition |
1674 | #ifndef STB_VORBIS_CODEBOOK_FLOATS |
1675 | #define CODEBOOK_ELEMENT(c,off)(c->multiplicands[off]) (c->multiplicands[off] * c->delta_value + c->minimum_value) |
1676 | #define CODEBOOK_ELEMENT_FAST(c,off)(c->multiplicands[off]) (c->multiplicands[off] * c->delta_value) |
1677 | #define CODEBOOK_ELEMENT_BASE(c)(0) (c->minimum_value) |
1678 | #else |
1679 | #define CODEBOOK_ELEMENT(c,off)(c->multiplicands[off]) (c->multiplicands[off]) |
1680 | #define CODEBOOK_ELEMENT_FAST(c,off)(c->multiplicands[off]) (c->multiplicands[off]) |
1681 | #define CODEBOOK_ELEMENT_BASE(c)(0) (0) |
1682 | #endif |
1683 | |
1684 | static int codebook_decode_start(vorb *f, Codebook *c, int len) |
1685 | { |
1686 | int z = -1; |
1687 | |
1688 | // type 0 is only legal in a scalar context |
1689 | if (c->lookup_type == 0) |
1690 | error(f, VORBIS_invalid_stream); |
1691 | else { |
1692 | DECODE_VQ(z,f,c)if (f->valid_bits < 10) prep_huffman(f); z = f->acc & ((1 << 10) - 1); z = c->fast_huffman[z]; if (z >= 0) { int n = c->codeword_lengths[z]; f->acc >>= n ; f->valid_bits -= n; if (f->valid_bits < 0) { f-> valid_bits = 0; z = -1; } } else { z = codebook_decode_scalar_raw (f,c); }; |
1693 | if (c->sparse) assert(z < c->sorted_entries)((z < c->sorted_entries) ? (void)0 : _assert("z < c->sorted_entries" , "src/siege/internal/stb/stb_vorbis.c", 1693)); |
1694 | if (z < 0) { // check for EOP |
1695 | if (!f->bytes_in_seg) |
1696 | if (f->last_seg) |
1697 | return z; |
1698 | error(f, VORBIS_invalid_stream); |
1699 | } |
1700 | } |
1701 | return z; |
1702 | } |
1703 | |
1704 | static int codebook_decode(vorb *f, Codebook *c, float *output, int len) |
1705 | { |
1706 | int i,z = codebook_decode_start(f,c,len); |
1707 | if (z < 0) return FALSE0; |
1708 | if (len > c->dimensions) len = c->dimensions; |
1709 | |
1710 | #ifdef STB_VORBIS_DIVIDES_IN_CODEBOOK |
1711 | if (c->lookup_type == 1) { |
1712 | float last = CODEBOOK_ELEMENT_BASE(c)(0); |
1713 | int div = 1; |
1714 | for (i=0; i < len; ++i) { |
1715 | int off = (z / div) % c->lookup_values; |
1716 | float val = CODEBOOK_ELEMENT_FAST(c,off)(c->multiplicands[off]) + last; |
1717 | output[i] += val; |
1718 | if (c->sequence_p) last = val + c->minimum_value; |
1719 | div *= c->lookup_values; |
1720 | } |
1721 | return TRUE1; |
1722 | } |
1723 | #endif |
1724 | |
1725 | z *= c->dimensions; |
1726 | if (c->sequence_p) { |
1727 | float last = CODEBOOK_ELEMENT_BASE(c)(0); |
1728 | for (i=0; i < len; ++i) { |
1729 | float val = CODEBOOK_ELEMENT_FAST(c,z+i)(c->multiplicands[z+i]) + last; |
1730 | output[i] += val; |
1731 | last = val + c->minimum_value; |
1732 | } |
1733 | } else { |
1734 | float last = CODEBOOK_ELEMENT_BASE(c)(0); |
1735 | for (i=0; i < len; ++i) { |
1736 | output[i] += CODEBOOK_ELEMENT_FAST(c,z+i)(c->multiplicands[z+i]) + last; |
1737 | } |
1738 | } |
1739 | |
1740 | return TRUE1; |
1741 | } |
1742 | |
1743 | static int codebook_decode_step(vorb *f, Codebook *c, float *output, int len, int step) |
1744 | { |
1745 | int i,z = codebook_decode_start(f,c,len); |
1746 | float last = CODEBOOK_ELEMENT_BASE(c)(0); |
1747 | if (z < 0) return FALSE0; |
1748 | if (len > c->dimensions) len = c->dimensions; |
1749 | |
1750 | #ifdef STB_VORBIS_DIVIDES_IN_CODEBOOK |
1751 | if (c->lookup_type == 1) { |
1752 | int div = 1; |
1753 | for (i=0; i < len; ++i) { |
1754 | int off = (z / div) % c->lookup_values; |
1755 | float val = CODEBOOK_ELEMENT_FAST(c,off)(c->multiplicands[off]) + last; |
1756 | output[i*step] += val; |
1757 | if (c->sequence_p) last = val; |
1758 | div *= c->lookup_values; |
1759 | } |
1760 | return TRUE1; |
1761 | } |
1762 | #endif |
1763 | |
1764 | z *= c->dimensions; |
1765 | for (i=0; i < len; ++i) { |
1766 | float val = CODEBOOK_ELEMENT_FAST(c,z+i)(c->multiplicands[z+i]) + last; |
1767 | output[i*step] += val; |
1768 | if (c->sequence_p) last = val; |
1769 | } |
1770 | |
1771 | return TRUE1; |
1772 | } |
1773 | |
1774 | static int codebook_decode_deinterleave_repeat(vorb *f, Codebook *c, float **outputs, int ch, int *c_inter_p, int *p_inter_p, int len, int total_decode) |
1775 | { |
1776 | int c_inter = *c_inter_p; |
1777 | int p_inter = *p_inter_p; |
1778 | int i,z, effective = c->dimensions; |
1779 | |
1780 | // type 0 is only legal in a scalar context |
1781 | if (c->lookup_type == 0) return error(f, VORBIS_invalid_stream); |
1782 | |
1783 | while (total_decode > 0) { |
1784 | float last = CODEBOOK_ELEMENT_BASE(c)(0); |
1785 | DECODE_VQ(z,f,c)if (f->valid_bits < 10) prep_huffman(f); z = f->acc & ((1 << 10) - 1); z = c->fast_huffman[z]; if (z >= 0) { int n = c->codeword_lengths[z]; f->acc >>= n ; f->valid_bits -= n; if (f->valid_bits < 0) { f-> valid_bits = 0; z = -1; } } else { z = codebook_decode_scalar_raw (f,c); }; |
1786 | #ifndef STB_VORBIS_DIVIDES_IN_CODEBOOK |
1787 | assert(!c->sparse || z < c->sorted_entries)((!c->sparse || z < c->sorted_entries) ? (void)0 : _assert ("!c->sparse || z < c->sorted_entries", "src/siege/internal/stb/stb_vorbis.c" , 1787)); |
1788 | #endif |
1789 | if (z < 0) { |
1790 | if (!f->bytes_in_seg) |
1791 | if (f->last_seg) return FALSE0; |
1792 | return error(f, VORBIS_invalid_stream); |
1793 | } |
1794 | |
1795 | // if this will take us off the end of the buffers, stop short! |
1796 | // we check by computing the length of the virtual interleaved |
1797 | // buffer (len*ch), our current offset within it (p_inter*ch)+(c_inter), |
1798 | // and the length we'll be using (effective) |
1799 | if (c_inter + p_inter*ch + effective > len * ch) { |
1800 | effective = len*ch - (p_inter*ch - c_inter); |
1801 | } |
1802 | |
1803 | #ifdef STB_VORBIS_DIVIDES_IN_CODEBOOK |
1804 | if (c->lookup_type == 1) { |
1805 | int div = 1; |
1806 | for (i=0; i < effective; ++i) { |
1807 | int off = (z / div) % c->lookup_values; |
1808 | float val = CODEBOOK_ELEMENT_FAST(c,off)(c->multiplicands[off]) + last; |
1809 | outputs[c_inter][p_inter] += val; |
1810 | if (++c_inter == ch) { c_inter = 0; ++p_inter; } |
1811 | if (c->sequence_p) last = val; |
1812 | div *= c->lookup_values; |
1813 | } |
1814 | } else |
1815 | #endif |
1816 | { |
1817 | z *= c->dimensions; |
1818 | if (c->sequence_p) { |
1819 | for (i=0; i < effective; ++i) { |
1820 | float val = CODEBOOK_ELEMENT_FAST(c,z+i)(c->multiplicands[z+i]) + last; |
1821 | outputs[c_inter][p_inter] += val; |
1822 | if (++c_inter == ch) { c_inter = 0; ++p_inter; } |
1823 | last = val; |
1824 | } |
1825 | } else { |
1826 | for (i=0; i < effective; ++i) { |
1827 | float val = CODEBOOK_ELEMENT_FAST(c,z+i)(c->multiplicands[z+i]) + last; |
1828 | outputs[c_inter][p_inter] += val; |
1829 | if (++c_inter == ch) { c_inter = 0; ++p_inter; } |
1830 | } |
1831 | } |
1832 | } |
1833 | |
1834 | total_decode -= effective; |
1835 | } |
1836 | *c_inter_p = c_inter; |
1837 | *p_inter_p = p_inter; |
1838 | return TRUE1; |
1839 | } |
1840 | |
1841 | #ifndef STB_VORBIS_DIVIDES_IN_CODEBOOK |
1842 | static int codebook_decode_deinterleave_repeat_2(vorb *f, Codebook *c, float **outputs, int *c_inter_p, int *p_inter_p, int len, int total_decode) |
1843 | { |
1844 | int c_inter = *c_inter_p; |
1845 | int p_inter = *p_inter_p; |
1846 | int i,z, effective = c->dimensions; |
1847 | |
1848 | // type 0 is only legal in a scalar context |
1849 | if (c->lookup_type == 0) return error(f, VORBIS_invalid_stream); |
1850 | |
1851 | while (total_decode > 0) { |
1852 | float last = CODEBOOK_ELEMENT_BASE(c)(0); |
1853 | DECODE_VQ(z,f,c)if (f->valid_bits < 10) prep_huffman(f); z = f->acc & ((1 << 10) - 1); z = c->fast_huffman[z]; if (z >= 0) { int n = c->codeword_lengths[z]; f->acc >>= n ; f->valid_bits -= n; if (f->valid_bits < 0) { f-> valid_bits = 0; z = -1; } } else { z = codebook_decode_scalar_raw (f,c); }; |
1854 | |
1855 | if (z < 0) { |
1856 | if (!f->bytes_in_seg) |
1857 | if (f->last_seg) return FALSE0; |
1858 | return error(f, VORBIS_invalid_stream); |
1859 | } |
1860 | |
1861 | // if this will take us off the end of the buffers, stop short! |
1862 | // we check by computing the length of the virtual interleaved |
1863 | // buffer (len*ch), our current offset within it (p_inter*ch)+(c_inter), |
1864 | // and the length we'll be using (effective) |
1865 | if (c_inter + p_inter*2 + effective > len * 2) { |
1866 | effective = len*2 - (p_inter*2 - c_inter); |
1867 | } |
1868 | |
1869 | { |
1870 | z *= c->dimensions; |
1871 | stb_prof(11)(void)0; |
1872 | if (c->sequence_p) { |
1873 | // haven't optimized this case because I don't have any examples |
1874 | for (i=0; i < effective; ++i) { |
1875 | float val = CODEBOOK_ELEMENT_FAST(c,z+i)(c->multiplicands[z+i]) + last; |
1876 | outputs[c_inter][p_inter] += val; |
1877 | if (++c_inter == 2) { c_inter = 0; ++p_inter; } |
1878 | last = val; |
1879 | } |
1880 | } else { |
1881 | i=0; |
1882 | if (c_inter == 1) { |
1883 | float val = CODEBOOK_ELEMENT_FAST(c,z+i)(c->multiplicands[z+i]) + last; |
1884 | outputs[c_inter][p_inter] += val; |
1885 | c_inter = 0; ++p_inter; |
1886 | ++i; |
1887 | } |
1888 | { |
1889 | float *z0 = outputs[0]; |
1890 | float *z1 = outputs[1]; |
1891 | for (; i+1 < effective;) { |
1892 | z0[p_inter] += CODEBOOK_ELEMENT_FAST(c,z+i)(c->multiplicands[z+i]) + last; |
1893 | z1[p_inter] += CODEBOOK_ELEMENT_FAST(c,z+i+1)(c->multiplicands[z+i+1]) + last; |
1894 | ++p_inter; |
1895 | i += 2; |
1896 | } |
1897 | } |
1898 | if (i < effective) { |
1899 | float val = CODEBOOK_ELEMENT_FAST(c,z+i)(c->multiplicands[z+i]) + last; |
1900 | outputs[c_inter][p_inter] += val; |
1901 | if (++c_inter == 2) { c_inter = 0; ++p_inter; } |
1902 | } |
1903 | } |
1904 | } |
1905 | |
1906 | total_decode -= effective; |
1907 | } |
1908 | *c_inter_p = c_inter; |
1909 | *p_inter_p = p_inter; |
1910 | return TRUE1; |
1911 | } |
1912 | #endif |
1913 | |
1914 | static int predict_point(int x, int x0, int x1, int y0, int y1) |
1915 | { |
1916 | int dy = y1 - y0; |
1917 | int adx = x1 - x0; |
1918 | // @OPTIMIZE: force int division to round in the right direction... is this necessary on x86? |
1919 | int err = abs(dy) * (x - x0); |
1920 | int off = err / adx; |
1921 | return dy < 0 ? y0 - off : y0 + off; |
1922 | } |
1923 | |
1924 | // the following table is block-copied from the specification |
1925 | static float inverse_db_table[256] = |
1926 | { |
1927 | 1.0649863e-07f, 1.1341951e-07f, 1.2079015e-07f, 1.2863978e-07f, |
1928 | 1.3699951e-07f, 1.4590251e-07f, 1.5538408e-07f, 1.6548181e-07f, |
1929 | 1.7623575e-07f, 1.8768855e-07f, 1.9988561e-07f, 2.1287530e-07f, |
1930 | 2.2670913e-07f, 2.4144197e-07f, 2.5713223e-07f, 2.7384213e-07f, |
1931 | 2.9163793e-07f, 3.1059021e-07f, 3.3077411e-07f, 3.5226968e-07f, |
1932 | 3.7516214e-07f, 3.9954229e-07f, 4.2550680e-07f, 4.5315863e-07f, |
1933 | 4.8260743e-07f, 5.1396998e-07f, 5.4737065e-07f, 5.8294187e-07f, |
1934 | 6.2082472e-07f, 6.6116941e-07f, 7.0413592e-07f, 7.4989464e-07f, |
1935 | 7.9862701e-07f, 8.5052630e-07f, 9.0579828e-07f, 9.6466216e-07f, |
1936 | 1.0273513e-06f, 1.0941144e-06f, 1.1652161e-06f, 1.2409384e-06f, |
1937 | 1.3215816e-06f, 1.4074654e-06f, 1.4989305e-06f, 1.5963394e-06f, |
1938 | 1.7000785e-06f, 1.8105592e-06f, 1.9282195e-06f, 2.0535261e-06f, |
1939 | 2.1869758e-06f, 2.3290978e-06f, 2.4804557e-06f, 2.6416497e-06f, |
1940 | 2.8133190e-06f, 2.9961443e-06f, 3.1908506e-06f, 3.3982101e-06f, |
1941 | 3.6190449e-06f, 3.8542308e-06f, 4.1047004e-06f, 4.3714470e-06f, |
1942 | 4.6555282e-06f, 4.9580707e-06f, 5.2802740e-06f, 5.6234160e-06f, |
1943 | 5.9888572e-06f, 6.3780469e-06f, 6.7925283e-06f, 7.2339451e-06f, |
1944 | 7.7040476e-06f, 8.2047000e-06f, 8.7378876e-06f, 9.3057248e-06f, |
1945 | 9.9104632e-06f, 1.0554501e-05f, 1.1240392e-05f, 1.1970856e-05f, |
1946 | 1.2748789e-05f, 1.3577278e-05f, 1.4459606e-05f, 1.5399272e-05f, |
1947 | 1.6400004e-05f, 1.7465768e-05f, 1.8600792e-05f, 1.9809576e-05f, |
1948 | 2.1096914e-05f, 2.2467911e-05f, 2.3928002e-05f, 2.5482978e-05f, |
1949 | 2.7139006e-05f, 2.8902651e-05f, 3.0780908e-05f, 3.2781225e-05f, |
1950 | 3.4911534e-05f, 3.7180282e-05f, 3.9596466e-05f, 4.2169667e-05f, |
1951 | 4.4910090e-05f, 4.7828601e-05f, 5.0936773e-05f, 5.4246931e-05f, |
1952 | 5.7772202e-05f, 6.1526565e-05f, 6.5524908e-05f, 6.9783085e-05f, |
1953 | 7.4317983e-05f, 7.9147585e-05f, 8.4291040e-05f, 8.9768747e-05f, |
1954 | 9.5602426e-05f, 0.00010181521f, 0.00010843174f, 0.00011547824f, |
1955 | 0.00012298267f, 0.00013097477f, 0.00013948625f, 0.00014855085f, |
1956 | 0.00015820453f, 0.00016848555f, 0.00017943469f, 0.00019109536f, |
1957 | 0.00020351382f, 0.00021673929f, 0.00023082423f, 0.00024582449f, |
1958 | 0.00026179955f, 0.00027881276f, 0.00029693158f, 0.00031622787f, |
1959 | 0.00033677814f, 0.00035866388f, 0.00038197188f, 0.00040679456f, |
1960 | 0.00043323036f, 0.00046138411f, 0.00049136745f, 0.00052329927f, |
1961 | 0.00055730621f, 0.00059352311f, 0.00063209358f, 0.00067317058f, |
1962 | 0.00071691700f, 0.00076350630f, 0.00081312324f, 0.00086596457f, |
1963 | 0.00092223983f, 0.00098217216f, 0.0010459992f, 0.0011139742f, |
1964 | 0.0011863665f, 0.0012634633f, 0.0013455702f, 0.0014330129f, |
1965 | 0.0015261382f, 0.0016253153f, 0.0017309374f, 0.0018434235f, |
1966 | 0.0019632195f, 0.0020908006f, 0.0022266726f, 0.0023713743f, |
1967 | 0.0025254795f, 0.0026895994f, 0.0028643847f, 0.0030505286f, |
1968 | 0.0032487691f, 0.0034598925f, 0.0036847358f, 0.0039241906f, |
1969 | 0.0041792066f, 0.0044507950f, 0.0047400328f, 0.0050480668f, |
1970 | 0.0053761186f, 0.0057254891f, 0.0060975636f, 0.0064938176f, |
1971 | 0.0069158225f, 0.0073652516f, 0.0078438871f, 0.0083536271f, |
1972 | 0.0088964928f, 0.009474637f, 0.010090352f, 0.010746080f, |
1973 | 0.011444421f, 0.012188144f, 0.012980198f, 0.013823725f, |
1974 | 0.014722068f, 0.015678791f, 0.016697687f, 0.017782797f, |
1975 | 0.018938423f, 0.020169149f, 0.021479854f, 0.022875735f, |
1976 | 0.024362330f, 0.025945531f, 0.027631618f, 0.029427276f, |
1977 | 0.031339626f, 0.033376252f, 0.035545228f, 0.037855157f, |
1978 | 0.040315199f, 0.042935108f, 0.045725273f, 0.048696758f, |
1979 | 0.051861348f, 0.055231591f, 0.058820850f, 0.062643361f, |
1980 | 0.066714279f, 0.071049749f, 0.075666962f, 0.080584227f, |
1981 | 0.085821044f, 0.091398179f, 0.097337747f, 0.10366330f, |
1982 | 0.11039993f, 0.11757434f, 0.12521498f, 0.13335215f, |
1983 | 0.14201813f, 0.15124727f, 0.16107617f, 0.17154380f, |
1984 | 0.18269168f, 0.19456402f, 0.20720788f, 0.22067342f, |
1985 | 0.23501402f, 0.25028656f, 0.26655159f, 0.28387361f, |
1986 | 0.30232132f, 0.32196786f, 0.34289114f, 0.36517414f, |
1987 | 0.38890521f, 0.41417847f, 0.44109412f, 0.46975890f, |
1988 | 0.50028648f, 0.53279791f, 0.56742212f, 0.60429640f, |
1989 | 0.64356699f, 0.68538959f, 0.72993007f, 0.77736504f, |
1990 | 0.82788260f, 0.88168307f, 0.9389798f, 1.0f |
1991 | }; |
1992 | |
1993 | |
1994 | // @OPTIMIZE: if you want to replace this bresenham line-drawing routine, |
1995 | // note that you must produce bit-identical output to decode correctly; |
1996 | // this specific sequence of operations is specified in the spec (it's |
1997 | // drawing integer-quantized frequency-space lines that the encoder |
1998 | // expects to be exactly the same) |
1999 | // ... also, isn't the whole point of Bresenham's algorithm to NOT |
2000 | // have to divide in the setup? sigh. |
2001 | #ifndef STB_VORBIS_NO_DEFER_FLOOR |
2002 | #define LINE_OP(a,b)a *= b a *= b |
2003 | #else |
2004 | #define LINE_OP(a,b)a *= b a = b |
2005 | #endif |
2006 | |
2007 | #ifdef STB_VORBIS_DIVIDE_TABLE |
2008 | #define DIVTAB_NUMER 32 |
2009 | #define DIVTAB_DENOM 64 |
2010 | int8 integer_divide_table[DIVTAB_NUMER][DIVTAB_DENOM]; // 2KB |
2011 | #endif |
2012 | |
2013 | static __forceinlineinline void draw_line(float *output, int x0, int y0, int x1, int y1, int n) |
2014 | { |
2015 | int dy = y1 - y0; |
2016 | int adx = x1 - x0; |
2017 | int ady = abs(dy); |
2018 | int base; |
2019 | int x=x0,y=y0; |
2020 | int err = 0; |
2021 | int sy; |
2022 | |
2023 | #ifdef STB_VORBIS_DIVIDE_TABLE |
2024 | if (adx < DIVTAB_DENOM && ady < DIVTAB_NUMER) { |
2025 | if (dy < 0) { |
2026 | base = -integer_divide_table[ady][adx]; |
2027 | sy = base-1; |
2028 | } else { |
2029 | base = integer_divide_table[ady][adx]; |
2030 | sy = base+1; |
2031 | } |
2032 | } else { |
2033 | base = dy / adx; |
2034 | if (dy < 0) |
2035 | sy = base - 1; |
2036 | else |
2037 | sy = base+1; |
2038 | } |
2039 | #else |
2040 | base = dy / adx; |
2041 | if (dy < 0) |
2042 | sy = base - 1; |
2043 | else |
2044 | sy = base+1; |
2045 | #endif |
2046 | ady -= abs(base) * adx; |
2047 | if (x1 > n) x1 = n; |
2048 | LINE_OP(output[x], inverse_db_table[y])output[x] *= inverse_db_table[y]; |
2049 | for (++x; x < x1; ++x) { |
2050 | err += ady; |
2051 | if (err >= adx) { |
2052 | err -= adx; |
2053 | y += sy; |
2054 | } else |
2055 | y += base; |
2056 | LINE_OP(output[x], inverse_db_table[y])output[x] *= inverse_db_table[y]; |
2057 | } |
2058 | } |
2059 | |
2060 | static int residue_decode(vorb *f, Codebook *book, float *target, int offset, int n, int rtype) |
2061 | { |
2062 | int k; |
2063 | if (rtype == 0) { |
2064 | int step = n / book->dimensions; |
2065 | for (k=0; k < step; ++k) |
2066 | if (!codebook_decode_step(f, book, target+offset+k, n-offset-k, step)) |
2067 | return FALSE0; |
2068 | } else { |
2069 | for (k=0; k < n; ) { |
2070 | if (!codebook_decode(f, book, target+offset, n-k)) |
2071 | return FALSE0; |
2072 | k += book->dimensions; |
2073 | offset += book->dimensions; |
2074 | } |
2075 | } |
2076 | return TRUE1; |
2077 | } |
2078 | |
2079 | static void decode_residue(vorb *f, float *residue_buffers[], int ch, int n, int rn, uint8 *do_not_decode) |
2080 | { |
2081 | int i,j,pass; |
2082 | Residue *r = f->residue_config + rn; |
2083 | int rtype = f->residue_types[rn]; |
2084 | int c = r->classbook; |
2085 | int classwords = f->codebooks[c].dimensions; |
2086 | int n_read = r->end - r->begin; |
2087 | int part_read = n_read / r->part_size; |
2088 | int temp_alloc_point = temp_alloc_save(f)((f)->temp_offset); |
2089 | #ifndef STB_VORBIS_DIVIDES_IN_RESIDUE |
2090 | uint8 ***part_classdata = (uint8 ***) temp_block_array(f,f->channels, part_read * sizeof(**part_classdata))make_block_array((f->alloc.alloc_buffer ? setup_temp_malloc (f,(f->channels*(sizeof(void *)+(part_read * sizeof(**part_classdata ))))) : alloca((f->channels*(sizeof(void *)+(part_read * sizeof (**part_classdata)))))), f->channels, part_read * sizeof(* *part_classdata)); |
2091 | #else |
2092 | int **classifications = (int **) temp_block_array(f,f->channels, part_read * sizeof(**classifications))make_block_array((f->alloc.alloc_buffer ? setup_temp_malloc (f,(f->channels*(sizeof(void *)+(part_read * sizeof(**classifications ))))) : alloca((f->channels*(sizeof(void *)+(part_read * sizeof (**classifications)))))), f->channels, part_read * sizeof( **classifications)); |
2093 | #endif |
2094 | |
2095 | stb_prof(2)(void)0; |
2096 | for (i=0; i < ch; ++i) |
2097 | if (!do_not_decode[i]) |
2098 | memset(residue_buffers[i], 0, sizeof(float) * n); |
2099 | |
2100 | if (rtype == 2 && ch != 1) { |
2101 | int len = ch * n; |
2102 | (void)len; |
2103 | for (j=0; j < ch; ++j) |
2104 | if (!do_not_decode[j]) |
2105 | break; |
2106 | if (j == ch) |
2107 | goto done; |
2108 | |
2109 | stb_prof(3)(void)0; |
2110 | for (pass=0; pass < 8; ++pass) { |
2111 | int pcount = 0, class_set = 0; |
2112 | if (ch == 2) { |
2113 | stb_prof(13)(void)0; |
2114 | while (pcount < part_read) { |
2115 | int z = r->begin + pcount*r->part_size; |
2116 | int c_inter = (z & 1), p_inter = z>>1; |
2117 | if (pass == 0) { |
2118 | Codebook *c = f->codebooks+r->classbook; |
2119 | int q; |
2120 | DECODE(q,f,c)if (f->valid_bits < 10) prep_huffman(f); q = f->acc & ((1 << 10) - 1); q = c->fast_huffman[q]; if (q >= 0) { int n = c->codeword_lengths[q]; f->acc >>= n ; f->valid_bits -= n; if (f->valid_bits < 0) { f-> valid_bits = 0; q = -1; } } else { q = codebook_decode_scalar_raw (f,c); } if (c->sparse) q = c->sorted_values[q];; |
2121 | if (q == EOP(-1)) goto done; |
2122 | #ifndef STB_VORBIS_DIVIDES_IN_RESIDUE |
2123 | part_classdata[0][class_set] = r->classdata[q]; |
2124 | #else |
2125 | for (i=classwords-1; i >= 0; --i) { |
2126 | classifications[0][i+pcount] = q % r->classifications; |
2127 | q /= r->classifications; |
2128 | } |
2129 | #endif |
2130 | } |
2131 | stb_prof(5)(void)0; |
2132 | for (i=0; i < classwords && pcount < part_read; ++i, ++pcount) { |
2133 | int z = r->begin + pcount*r->part_size; |
2134 | #ifndef STB_VORBIS_DIVIDES_IN_RESIDUE |
2135 | int c = part_classdata[0][class_set][i]; |
2136 | #else |
2137 | int c = classifications[0][pcount]; |
2138 | #endif |
2139 | int b = r->residue_books[c][pass]; |
2140 | if (b >= 0) { |
2141 | Codebook *book = f->codebooks + b; |
2142 | stb_prof(20)(void)0; // accounts for X time |
2143 | #ifdef STB_VORBIS_DIVIDES_IN_CODEBOOK |
2144 | if (!codebook_decode_deinterleave_repeat(f, book, residue_buffers, ch, &c_inter, &p_inter, n, r->part_size)) |
2145 | goto done; |
2146 | #else |
2147 | // saves 1% |
2148 | if (!codebook_decode_deinterleave_repeat_2(f, book, residue_buffers, &c_inter, &p_inter, n, r->part_size)) |
2149 | goto done; |
2150 | #endif |
2151 | stb_prof(7)(void)0; |
2152 | } else { |
2153 | z += r->part_size; |
2154 | c_inter = z & 1; |
2155 | p_inter = z >> 1; |
2156 | } |
2157 | } |
2158 | stb_prof(8)(void)0; |
2159 | #ifndef STB_VORBIS_DIVIDES_IN_RESIDUE |
2160 | ++class_set; |
2161 | #endif |
2162 | } |
2163 | } else if (ch == 1) { |
2164 | while (pcount < part_read) { |
2165 | int z = r->begin + pcount*r->part_size; |
2166 | int c_inter = 0, p_inter = z; |
2167 | if (pass == 0) { |
2168 | Codebook *c = f->codebooks+r->classbook; |
2169 | int q; |
2170 | DECODE(q,f,c)if (f->valid_bits < 10) prep_huffman(f); q = f->acc & ((1 << 10) - 1); q = c->fast_huffman[q]; if (q >= 0) { int n = c->codeword_lengths[q]; f->acc >>= n ; f->valid_bits -= n; if (f->valid_bits < 0) { f-> valid_bits = 0; q = -1; } } else { q = codebook_decode_scalar_raw (f,c); } if (c->sparse) q = c->sorted_values[q];; |
2171 | if (q == EOP(-1)) goto done; |
2172 | #ifndef STB_VORBIS_DIVIDES_IN_RESIDUE |
2173 | part_classdata[0][class_set] = r->classdata[q]; |
2174 | #else |
2175 | for (i=classwords-1; i >= 0; --i) { |
2176 | classifications[0][i+pcount] = q % r->classifications; |
2177 | q /= r->classifications; |
2178 | } |
2179 | #endif |
2180 | } |
2181 | for (i=0; i < classwords && pcount < part_read; ++i, ++pcount) { |
2182 | int z = r->begin + pcount*r->part_size; |
2183 | #ifndef STB_VORBIS_DIVIDES_IN_RESIDUE |
2184 | int c = part_classdata[0][class_set][i]; |
2185 | #else |
2186 | int c = classifications[0][pcount]; |
2187 | #endif |
2188 | int b = r->residue_books[c][pass]; |
2189 | if (b >= 0) { |
2190 | Codebook *book = f->codebooks + b; |
2191 | stb_prof(22)(void)0; |
2192 | if (!codebook_decode_deinterleave_repeat(f, book, residue_buffers, ch, &c_inter, &p_inter, n, r->part_size)) |
2193 | goto done; |
2194 | stb_prof(3)(void)0; |
2195 | } else { |
2196 | z += r->part_size; |
2197 | c_inter = 0; |
2198 | p_inter = z; |
2199 | } |
2200 | } |
2201 | #ifndef STB_VORBIS_DIVIDES_IN_RESIDUE |
2202 | ++class_set; |
2203 | #endif |
2204 | } |
2205 | } else { |
2206 | while (pcount < part_read) { |
2207 | int z = r->begin + pcount*r->part_size; |
2208 | int c_inter = z % ch, p_inter = z/ch; |
2209 | if (pass == 0) { |
2210 | Codebook *c = f->codebooks+r->classbook; |
2211 | int q; |
2212 | DECODE(q,f,c)if (f->valid_bits < 10) prep_huffman(f); q = f->acc & ((1 << 10) - 1); q = c->fast_huffman[q]; if (q >= 0) { int n = c->codeword_lengths[q]; f->acc >>= n ; f->valid_bits -= n; if (f->valid_bits < 0) { f-> valid_bits = 0; q = -1; } } else { q = codebook_decode_scalar_raw (f,c); } if (c->sparse) q = c->sorted_values[q];; |
2213 | if (q == EOP(-1)) goto done; |
2214 | #ifndef STB_VORBIS_DIVIDES_IN_RESIDUE |
2215 | part_classdata[0][class_set] = r->classdata[q]; |
2216 | #else |
2217 | for (i=classwords-1; i >= 0; --i) { |
2218 | classifications[0][i+pcount] = q % r->classifications; |
2219 | q /= r->classifications; |
2220 | } |
2221 | #endif |
2222 | } |
2223 | for (i=0; i < classwords && pcount < part_read; ++i, ++pcount) { |
2224 | int z = r->begin + pcount*r->part_size; |
2225 | #ifndef STB_VORBIS_DIVIDES_IN_RESIDUE |
2226 | int c = part_classdata[0][class_set][i]; |
2227 | #else |
2228 | int c = classifications[0][pcount]; |
2229 | #endif |
2230 | int b = r->residue_books[c][pass]; |
2231 | if (b >= 0) { |
2232 | Codebook *book = f->codebooks + b; |
2233 | stb_prof(22)(void)0; |
2234 | if (!codebook_decode_deinterleave_repeat(f, book, residue_buffers, ch, &c_inter, &p_inter, n, r->part_size)) |
2235 | goto done; |
2236 | stb_prof(3)(void)0; |
2237 | } else { |
2238 | z += r->part_size; |
2239 | c_inter = z % ch; |
2240 | p_inter = z / ch; |
2241 | } |
2242 | } |
2243 | #ifndef STB_VORBIS_DIVIDES_IN_RESIDUE |
2244 | ++class_set; |
2245 | #endif |
2246 | } |
2247 | } |
2248 | } |
2249 | goto done; |
2250 | } |
2251 | stb_prof(9)(void)0; |
2252 | |
2253 | for (pass=0; pass < 8; ++pass) { |
2254 | int pcount = 0, class_set=0; |
2255 | while (pcount < part_read) { |
2256 | if (pass == 0) { |
2257 | for (j=0; j < ch; ++j) { |
2258 | if (!do_not_decode[j]) { |
2259 | Codebook *c = f->codebooks+r->classbook; |
2260 | int temp; |
2261 | DECODE(temp,f,c)if (f->valid_bits < 10) prep_huffman(f); temp = f->acc & ((1 << 10) - 1); temp = c->fast_huffman[temp] ; if (temp >= 0) { int n = c->codeword_lengths[temp]; f ->acc >>= n; f->valid_bits -= n; if (f->valid_bits < 0) { f->valid_bits = 0; temp = -1; } } else { temp = codebook_decode_scalar_raw(f,c); } if (c->sparse) temp = c ->sorted_values[temp];; |
2262 | if (temp == EOP(-1)) goto done; |
2263 | #ifndef STB_VORBIS_DIVIDES_IN_RESIDUE |
2264 | part_classdata[j][class_set] = r->classdata[temp]; |
2265 | #else |
2266 | for (i=classwords-1; i >= 0; --i) { |
2267 | classifications[j][i+pcount] = temp % r->classifications; |
2268 | temp /= r->classifications; |
2269 | } |
2270 | #endif |
2271 | } |
2272 | } |
2273 | } |
2274 | for (i=0; i < classwords && pcount < part_read; ++i, ++pcount) { |
2275 | for (j=0; j < ch; ++j) { |
2276 | if (!do_not_decode[j]) { |
2277 | #ifndef STB_VORBIS_DIVIDES_IN_RESIDUE |
2278 | int c = part_classdata[j][class_set][i]; |
2279 | #else |
2280 | int c = classifications[j][pcount]; |
2281 | #endif |
2282 | int b = r->residue_books[c][pass]; |
2283 | if (b >= 0) { |
2284 | float *target = residue_buffers[j]; |
2285 | int offset = r->begin + pcount * r->part_size; |
2286 | int n = r->part_size; |
2287 | Codebook *book = f->codebooks + b; |
2288 | if (!residue_decode(f, book, target, offset, n, rtype)) |
2289 | goto done; |
2290 | } |
2291 | } |
2292 | } |
2293 | } |
2294 | #ifndef STB_VORBIS_DIVIDES_IN_RESIDUE |
2295 | ++class_set; |
2296 | #endif |
2297 | } |
2298 | } |
2299 | done: |
2300 | stb_prof(0)(void)0; |
2301 | temp_alloc_restore(f,temp_alloc_point)((f)->temp_offset = (temp_alloc_point)); |
2302 | } |
2303 | |
2304 | |
2305 | #if 0 |
2306 | // slow way for debugging |
2307 | void inverse_mdct_slow(float *buffer, int n) |
2308 | { |
2309 | int i,j; |
2310 | int n2 = n >> 1; |
2311 | float *x = (float *) malloc(sizeof(*x) * n2); |
2312 | memcpy(x, buffer, sizeof(*x) * n2); |
2313 | for (i=0; i < n; ++i) { |
2314 | float acc = 0; |
2315 | for (j=0; j < n2; ++j) |
2316 | // formula from paper: |
2317 | //acc += n/4.0f * x[j] * (float) cos(M_PI / 2 / n * (2 * i + 1 + n/2.0)*(2*j+1)); |
2318 | // formula from wikipedia |
2319 | //acc += 2.0f / n2 * x[j] * (float) cos(M_PI/n2 * (i + 0.5 + n2/2)*(j + 0.5)); |
2320 | // these are equivalent, except the formula from the paper inverts the multiplier! |
2321 | // however, what actually works is NO MULTIPLIER!?! |
2322 | //acc += 64 * 2.0f / n2 * x[j] * (float) cos(M_PI/n2 * (i + 0.5 + n2/2)*(j + 0.5)); |
2323 | acc += x[j] * (float) cos(M_PI3.14159265358979323846 / 2 / n * (2 * i + 1 + n/2.0)*(2*j+1)); |
2324 | buffer[i] = acc; |
2325 | } |
2326 | free(x); |
2327 | } |
2328 | #elif 0 |
2329 | // same as above, but just barely able to run in real time on modern machines |
2330 | void inverse_mdct_slow(float *buffer, int n, vorb *f, int blocktype) |
2331 | { |
2332 | float mcos[16384]; |
2333 | int i,j; |
2334 | int n2 = n >> 1, nmask = (n << 2) -1; |
2335 | float *x = (float *) malloc(sizeof(*x) * n2); |
2336 | memcpy(x, buffer, sizeof(*x) * n2); |
2337 | for (i=0; i < 4*n; ++i) |
2338 | mcos[i] = (float) cos(M_PI3.14159265358979323846 / 2 * i / n); |
2339 | |
2340 | for (i=0; i < n; ++i) { |
2341 | float acc = 0; |
2342 | for (j=0; j < n2; ++j) |
2343 | acc += x[j] * mcos[(2 * i + 1 + n2)*(2*j+1) & nmask]; |
2344 | buffer[i] = acc; |
2345 | } |
2346 | free(x); |
2347 | } |
2348 | #else |
2349 | // transform to use a slow dct-iv; this is STILL basically trivial, |
2350 | // but only requires half as many ops |
2351 | void dct_iv_slow(float *buffer, int n) |
2352 | { |
2353 | float mcos[16384]; |
2354 | float x[2048]; |
2355 | int i,j; |
2356 | int n2 = n >> 1, nmask = (n << 3) - 1; |
2357 | (void)n2; |
2358 | memcpy(x, buffer, sizeof(*x) * n); |
2359 | for (i=0; i < 8*n; ++i) |
2360 | mcos[i] = (float) cos(M_PI3.14159265358979323846 / 4 * i / n); |
2361 | for (i=0; i < n; ++i) { |
2362 | float acc = 0; |
2363 | for (j=0; j < n; ++j) |
2364 | acc += x[j] * mcos[((2 * i + 1)*(2*j+1)) & nmask]; |
2365 | //acc += x[j] * cos(M_PI / n * (i + 0.5) * (j + 0.5)); |
2366 | buffer[i] = acc; |
2367 | } |
2368 | } |
2369 | |
2370 | void inverse_mdct_slow(float *buffer, int n, vorb *f, int blocktype) |
2371 | { |
2372 | int i, n4 = n >> 2, n2 = n >> 1, n3_4 = n - n4; |
2373 | float temp[4096]; |
2374 | |
2375 | memcpy(temp, buffer, n2 * sizeof(float)); |
2376 | dct_iv_slow(temp, n2); // returns -c'-d, a-b' |
2377 | |
2378 | for (i=0; i < n4 ; ++i) buffer[i] = temp[i+n4]; // a-b' |
2379 | for ( ; i < n3_4; ++i) buffer[i] = -temp[n3_4 - i - 1]; // b-a', c+d' |
2380 | for ( ; i < n ; ++i) buffer[i] = -temp[i - n3_4]; // c'+d |
2381 | } |
2382 | #endif |
2383 | |
2384 | #ifndef LIBVORBIS_MDCT0 |
2385 | #define LIBVORBIS_MDCT0 0 |
2386 | #endif |
2387 | |
2388 | #if LIBVORBIS_MDCT0 |
2389 | // directly call the vorbis MDCT using an interface documented |
2390 | // by Jeff Roberts... useful for performance comparison |
2391 | typedef struct |
2392 | { |
2393 | int n; |
2394 | int log2n; |
2395 | |
2396 | float *trig; |
2397 | int *bitrev; |
2398 | |
2399 | float scale; |
2400 | } mdct_lookup; |
2401 | |
2402 | extern void mdct_init(mdct_lookup *lookup, int n); |
2403 | extern void mdct_clear(mdct_lookup *l); |
2404 | extern void mdct_backward(mdct_lookup *init, float *in, float *out); |
2405 | |
2406 | mdct_lookup M1,M2; |
2407 | |
2408 | void inverse_mdct(float *buffer, int n, vorb *f, int blocktype) |
2409 | { |
2410 | mdct_lookup *M; |
2411 | if (M1.n == n) M = &M1; |
2412 | else if (M2.n == n) M = &M2; |
2413 | else if (M1.n == 0) { mdct_init(&M1, n); M = &M1; } |
2414 | else { |
2415 | if (M2.n) __asm int 3; |
2416 | mdct_init(&M2, n); |
2417 | M = &M2; |
2418 | } |
2419 | |
2420 | mdct_backward(M, buffer, buffer); |
2421 | } |
2422 | #endif |
2423 | |
2424 | |
2425 | // the following were split out into separate functions while optimizing; |
2426 | // they could be pushed back up but eh. __forceinline showed no change; |
2427 | // they're probably already being inlined. |
2428 | static void imdct_step3_iter0_loop(int n, float *e, int i_off, int k_off, float *A) |
2429 | { |
2430 | float *ee0 = e + i_off; |
2431 | float *ee2 = ee0 + k_off; |
2432 | int i; |
2433 | |
2434 | assert((n & 3) == 0)(((n & 3) == 0) ? (void)0 : _assert("(n & 3) == 0", "src/siege/internal/stb/stb_vorbis.c" , 2434)); |
2435 | for (i=(n>>2); i > 0; --i) { |
2436 | float k00_20, k01_21; |
2437 | k00_20 = ee0[ 0] - ee2[ 0]; |
2438 | k01_21 = ee0[-1] - ee2[-1]; |
2439 | ee0[ 0] += ee2[ 0];//ee0[ 0] = ee0[ 0] + ee2[ 0]; |
2440 | ee0[-1] += ee2[-1];//ee0[-1] = ee0[-1] + ee2[-1]; |
2441 | ee2[ 0] = k00_20 * A[0] - k01_21 * A[1]; |
2442 | ee2[-1] = k01_21 * A[0] + k00_20 * A[1]; |
2443 | A += 8; |
2444 | |
2445 | k00_20 = ee0[-2] - ee2[-2]; |
2446 | k01_21 = ee0[-3] - ee2[-3]; |
2447 | ee0[-2] += ee2[-2];//ee0[-2] = ee0[-2] + ee2[-2]; |
2448 | ee0[-3] += ee2[-3];//ee0[-3] = ee0[-3] + ee2[-3]; |
2449 | ee2[-2] = k00_20 * A[0] - k01_21 * A[1]; |
2450 | ee2[-3] = k01_21 * A[0] + k00_20 * A[1]; |
2451 | A += 8; |
2452 | |
2453 | k00_20 = ee0[-4] - ee2[-4]; |
2454 | k01_21 = ee0[-5] - ee2[-5]; |
2455 | ee0[-4] += ee2[-4];//ee0[-4] = ee0[-4] + ee2[-4]; |
2456 | ee0[-5] += ee2[-5];//ee0[-5] = ee0[-5] + ee2[-5]; |
2457 | ee2[-4] = k00_20 * A[0] - k01_21 * A[1]; |
2458 | ee2[-5] = k01_21 * A[0] + k00_20 * A[1]; |
2459 | A += 8; |
2460 | |
2461 | k00_20 = ee0[-6] - ee2[-6]; |
2462 | k01_21 = ee0[-7] - ee2[-7]; |
2463 | ee0[-6] += ee2[-6];//ee0[-6] = ee0[-6] + ee2[-6]; |
2464 | ee0[-7] += ee2[-7];//ee0[-7] = ee0[-7] + ee2[-7]; |
2465 | ee2[-6] = k00_20 * A[0] - k01_21 * A[1]; |
2466 | ee2[-7] = k01_21 * A[0] + k00_20 * A[1]; |
2467 | A += 8; |
2468 | ee0 -= 8; |
2469 | ee2 -= 8; |
2470 | } |
2471 | } |
2472 | |
2473 | static void imdct_step3_inner_r_loop(int lim, float *e, int d0, int k_off, float *A, int k1) |
2474 | { |
2475 | int i; |
2476 | float k00_20, k01_21; |
2477 | |
2478 | float *e0 = e + d0; |
2479 | float *e2 = e0 + k_off; |
2480 | |
2481 | for (i=lim >> 2; i > 0; --i) { |
2482 | k00_20 = e0[-0] - e2[-0]; |
2483 | k01_21 = e0[-1] - e2[-1]; |
2484 | e0[-0] += e2[-0];//e0[-0] = e0[-0] + e2[-0]; |
2485 | e0[-1] += e2[-1];//e0[-1] = e0[-1] + e2[-1]; |
2486 | e2[-0] = (k00_20)*A[0] - (k01_21) * A[1]; |
2487 | e2[-1] = (k01_21)*A[0] + (k00_20) * A[1]; |
2488 | |
2489 | A += k1; |
2490 | |
2491 | k00_20 = e0[-2] - e2[-2]; |
2492 | k01_21 = e0[-3] - e2[-3]; |
2493 | e0[-2] += e2[-2];//e0[-2] = e0[-2] + e2[-2]; |
2494 | e0[-3] += e2[-3];//e0[-3] = e0[-3] + e2[-3]; |
2495 | e2[-2] = (k00_20)*A[0] - (k01_21) * A[1]; |
2496 | e2[-3] = (k01_21)*A[0] + (k00_20) * A[1]; |
2497 | |
2498 | A += k1; |
2499 | |
2500 | k00_20 = e0[-4] - e2[-4]; |
2501 | k01_21 = e0[-5] - e2[-5]; |
2502 | e0[-4] += e2[-4];//e0[-4] = e0[-4] + e2[-4]; |
2503 | e0[-5] += e2[-5];//e0[-5] = e0[-5] + e2[-5]; |
2504 | e2[-4] = (k00_20)*A[0] - (k01_21) * A[1]; |
2505 | e2[-5] = (k01_21)*A[0] + (k00_20) * A[1]; |
2506 | |
2507 | A += k1; |
2508 | |
2509 | k00_20 = e0[-6] - e2[-6]; |
2510 | k01_21 = e0[-7] - e2[-7]; |
2511 | e0[-6] += e2[-6];//e0[-6] = e0[-6] + e2[-6]; |
2512 | e0[-7] += e2[-7];//e0[-7] = e0[-7] + e2[-7]; |
2513 | e2[-6] = (k00_20)*A[0] - (k01_21) * A[1]; |
2514 | e2[-7] = (k01_21)*A[0] + (k00_20) * A[1]; |
2515 | |
2516 | e0 -= 8; |
2517 | e2 -= 8; |
2518 | |
2519 | A += k1; |
2520 | } |
2521 | } |
2522 | |
2523 | static void imdct_step3_inner_s_loop(int n, float *e, int i_off, int k_off, float *A, int a_off, int k0) |
2524 | { |
2525 | int i; |
2526 | float A0 = A[0]; |
2527 | float A1 = A[0+1]; |
2528 | float A2 = A[0+a_off]; |
2529 | float A3 = A[0+a_off+1]; |
2530 | float A4 = A[0+a_off*2+0]; |
2531 | float A5 = A[0+a_off*2+1]; |
2532 | float A6 = A[0+a_off*3+0]; |
2533 | float A7 = A[0+a_off*3+1]; |
2534 | |
2535 | float k00,k11; |
2536 | |
2537 | float *ee0 = e +i_off; |
2538 | float *ee2 = ee0+k_off; |
2539 | |
2540 | for (i=n; i > 0; --i) { |
2541 | k00 = ee0[ 0] - ee2[ 0]; |
2542 | k11 = ee0[-1] - ee2[-1]; |
2543 | ee0[ 0] = ee0[ 0] + ee2[ 0]; |
2544 | ee0[-1] = ee0[-1] + ee2[-1]; |
2545 | ee2[ 0] = (k00) * A0 - (k11) * A1; |
2546 | ee2[-1] = (k11) * A0 + (k00) * A1; |
2547 | |
2548 | k00 = ee0[-2] - ee2[-2]; |
2549 | k11 = ee0[-3] - ee2[-3]; |
2550 | ee0[-2] = ee0[-2] + ee2[-2]; |
2551 | ee0[-3] = ee0[-3] + ee2[-3]; |
2552 | ee2[-2] = (k00) * A2 - (k11) * A3; |
2553 | ee2[-3] = (k11) * A2 + (k00) * A3; |
2554 | |
2555 | k00 = ee0[-4] - ee2[-4]; |
2556 | k11 = ee0[-5] - ee2[-5]; |
2557 | ee0[-4] = ee0[-4] + ee2[-4]; |
2558 | ee0[-5] = ee0[-5] + ee2[-5]; |
2559 | ee2[-4] = (k00) * A4 - (k11) * A5; |
2560 | ee2[-5] = (k11) * A4 + (k00) * A5; |
2561 | |
2562 | k00 = ee0[-6] - ee2[-6]; |
2563 | k11 = ee0[-7] - ee2[-7]; |
2564 | ee0[-6] = ee0[-6] + ee2[-6]; |
2565 | ee0[-7] = ee0[-7] + ee2[-7]; |
2566 | ee2[-6] = (k00) * A6 - (k11) * A7; |
2567 | ee2[-7] = (k11) * A6 + (k00) * A7; |
2568 | |
2569 | ee0 -= k0; |
2570 | ee2 -= k0; |
2571 | } |
2572 | } |
2573 | |
2574 | static __forceinlineinline void iter_54(float *z) |
2575 | { |
2576 | float k00,k11,k22,k33; |
2577 | float y0,y1,y2,y3; |
2578 | |
2579 | k00 = z[ 0] - z[-4]; |
2580 | y0 = z[ 0] + z[-4]; |
2581 | y2 = z[-2] + z[-6]; |
2582 | k22 = z[-2] - z[-6]; |
2583 | |
2584 | z[-0] = y0 + y2; // z0 + z4 + z2 + z6 |
2585 | z[-2] = y0 - y2; // z0 + z4 - z2 - z6 |
2586 | |
2587 | // done with y0,y2 |
2588 | |
2589 | k33 = z[-3] - z[-7]; |
2590 | |
2591 | z[-4] = k00 + k33; // z0 - z4 + z3 - z7 |
2592 | z[-6] = k00 - k33; // z0 - z4 - z3 + z7 |
2593 | |
2594 | // done with k33 |
2595 | |
2596 | k11 = z[-1] - z[-5]; |
2597 | y1 = z[-1] + z[-5]; |
2598 | y3 = z[-3] + z[-7]; |
2599 | |
2600 | z[-1] = y1 + y3; // z1 + z5 + z3 + z7 |
2601 | z[-3] = y1 - y3; // z1 + z5 - z3 - z7 |
2602 | z[-5] = k11 - k22; // z1 - z5 + z2 - z6 |
2603 | z[-7] = k11 + k22; // z1 - z5 - z2 + z6 |
2604 | } |
2605 | |
2606 | static void imdct_step3_inner_s_loop_ld654(int n, float *e, int i_off, float *A, int base_n) |
2607 | { |
2608 | int k_off = -8; |
2609 | (void)k_off; |
2610 | int a_off = base_n >> 3; |
2611 | float A2 = A[0+a_off]; |
2612 | float *z = e + i_off; |
2613 | float *base = z - 16 * n; |
2614 | |
2615 | while (z > base) { |
2616 | float k00,k11; |
2617 | |
2618 | k00 = z[-0] - z[-8]; |
2619 | k11 = z[-1] - z[-9]; |
2620 | z[-0] = z[-0] + z[-8]; |
2621 | z[-1] = z[-1] + z[-9]; |
2622 | z[-8] = k00; |
2623 | z[-9] = k11 ; |
2624 | |
2625 | k00 = z[ -2] - z[-10]; |
2626 | k11 = z[ -3] - z[-11]; |
2627 | z[ -2] = z[ -2] + z[-10]; |
2628 | z[ -3] = z[ -3] + z[-11]; |
2629 | z[-10] = (k00+k11) * A2; |
2630 | z[-11] = (k11-k00) * A2; |
2631 | |
2632 | k00 = z[-12] - z[ -4]; // reverse to avoid a unary negation |
2633 | k11 = z[ -5] - z[-13]; |
2634 | z[ -4] = z[ -4] + z[-12]; |
2635 | z[ -5] = z[ -5] + z[-13]; |
2636 | z[-12] = k11; |
2637 | z[-13] = k00; |
2638 | |
2639 | k00 = z[-14] - z[ -6]; // reverse to avoid a unary negation |
2640 | k11 = z[ -7] - z[-15]; |
2641 | z[ -6] = z[ -6] + z[-14]; |
2642 | z[ -7] = z[ -7] + z[-15]; |
2643 | z[-14] = (k00+k11) * A2; |
2644 | z[-15] = (k00-k11) * A2; |
2645 | |
2646 | iter_54(z); |
2647 | iter_54(z-8); |
2648 | z -= 16; |
2649 | } |
2650 | } |
2651 | |
2652 | static void inverse_mdct(float *buffer, int n, vorb *f, int blocktype) |
2653 | { |
2654 | int n2 = n >> 1, n4 = n >> 2, n8 = n >> 3, l; |
2655 | int n3_4 = n - n4, ld; |
2656 | (void)n3_4; |
2657 | // @OPTIMIZE: reduce register pressure by using fewer variables? |
2658 | int save_point = temp_alloc_save(f)((f)->temp_offset); |
2659 | float *buf2 = (float *) temp_alloc(f, n2 * sizeof(*buf2))(f->alloc.alloc_buffer ? setup_temp_malloc(f,n2 * sizeof(* buf2)) : alloca(n2 * sizeof(*buf2))); |
2660 | float *u=NULL((void*)0),*v=NULL((void*)0); |
2661 | // twiddle factors |
2662 | float *A = f->A[blocktype]; |
2663 | |
2664 | // IMDCT algorithm from "The use of multirate filter banks for coding of high quality digital audio" |
2665 | // See notes about bugs in that paper in less-optimal implementation 'inverse_mdct_old' after this function. |
2666 | |
2667 | // kernel from paper |
2668 | |
2669 | |
2670 | // merged: |
2671 | // copy and reflect spectral data |
2672 | // step 0 |
2673 | |
2674 | // note that it turns out that the items added together during |
2675 | // this step are, in fact, being added to themselves (as reflected |
2676 | // by step 0). inexplicable inefficiency! this became obvious |
2677 | // once I combined the passes. |
2678 | |
2679 | // so there's a missing 'times 2' here (for adding X to itself). |
2680 | // this propogates through linearly to the end, where the numbers |
2681 | // are 1/2 too small, and need to be compensated for. |
2682 | |
2683 | { |
2684 | float *d,*e, *AA, *e_stop; |
2685 | d = &buf2[n2-2]; |
2686 | AA = A; |
2687 | e = &buffer[0]; |
2688 | e_stop = &buffer[n2]; |
2689 | while (e != e_stop) { |
2690 | d[1] = (e[0] * AA[0] - e[2]*AA[1]); |
2691 | d[0] = (e[0] * AA[1] + e[2]*AA[0]); |
2692 | d -= 2; |
2693 | AA += 2; |
2694 | e += 4; |
2695 | } |
2696 | |
2697 | e = &buffer[n2-3]; |
2698 | while (d >= buf2) { |
2699 | d[1] = (-e[2] * AA[0] - -e[0]*AA[1]); |
2700 | d[0] = (-e[2] * AA[1] + -e[0]*AA[0]); |
2701 | d -= 2; |
2702 | AA += 2; |
2703 | e -= 4; |
2704 | } |
2705 | } |
2706 | |
2707 | // now we use symbolic names for these, so that we can |
2708 | // possibly swap their meaning as we change which operations |
2709 | // are in place |
2710 | |
2711 | u = buffer; |
2712 | v = buf2; |
2713 | |
2714 | // step 2 (paper output is w, now u) |
2715 | // this could be in place, but the data ends up in the wrong |
2716 | // place... _somebody_'s got to swap it, so this is nominated |
2717 | { |
2718 | float *AA = &A[n2-8]; |
2719 | float *d0,*d1, *e0, *e1; |
2720 | |
2721 | e0 = &v[n4]; |
2722 | e1 = &v[0]; |
2723 | |
2724 | d0 = &u[n4]; |
2725 | d1 = &u[0]; |
2726 | |
2727 | while (AA >= A) { |
2728 | float v40_20, v41_21; |
2729 | |
2730 | v41_21 = e0[1] - e1[1]; |
2731 | v40_20 = e0[0] - e1[0]; |
2732 | d0[1] = e0[1] + e1[1]; |
2733 | d0[0] = e0[0] + e1[0]; |
2734 | d1[1] = v41_21*AA[4] - v40_20*AA[5]; |
2735 | d1[0] = v40_20*AA[4] + v41_21*AA[5]; |
2736 | |
2737 | v41_21 = e0[3] - e1[3]; |
2738 | v40_20 = e0[2] - e1[2]; |
2739 | d0[3] = e0[3] + e1[3]; |
2740 | d0[2] = e0[2] + e1[2]; |
2741 | d1[3] = v41_21*AA[0] - v40_20*AA[1]; |
2742 | d1[2] = v40_20*AA[0] + v41_21*AA[1]; |
2743 | |
2744 | AA -= 8; |
2745 | |
2746 | d0 += 4; |
2747 | d1 += 4; |
2748 | e0 += 4; |
2749 | e1 += 4; |
2750 | } |
2751 | } |
2752 | |
2753 | // step 3 |
2754 | ld = ilog(n) - 1; // ilog is off-by-one from normal definitions |
2755 | |
2756 | // optimized step 3: |
2757 | |
2758 | // the original step3 loop can be nested r inside s or s inside r; |
2759 | // it's written originally as s inside r, but this is dumb when r |
2760 | // iterates many times, and s few. So I have two copies of it and |
2761 | // switch between them halfway. |
2762 | |
2763 | // this is iteration 0 of step 3 |
2764 | imdct_step3_iter0_loop(n >> 4, u, n2-1-n4*0, -(n >> 3), A); |
2765 | imdct_step3_iter0_loop(n >> 4, u, n2-1-n4*1, -(n >> 3), A); |
2766 | |
2767 | // this is iteration 1 of step 3 |
2768 | imdct_step3_inner_r_loop(n >> 5, u, n2-1 - n8*0, -(n >> 4), A, 16); |
2769 | imdct_step3_inner_r_loop(n >> 5, u, n2-1 - n8*1, -(n >> 4), A, 16); |
2770 | imdct_step3_inner_r_loop(n >> 5, u, n2-1 - n8*2, -(n >> 4), A, 16); |
2771 | imdct_step3_inner_r_loop(n >> 5, u, n2-1 - n8*3, -(n >> 4), A, 16); |
2772 | |
2773 | l=2; |
2774 | for (; l < (ld-3)>>1; ++l) { |
2775 | int k0 = n >> (l+2), k0_2 = k0>>1; |
2776 | int lim = 1 << (l+1); |
2777 | int i; |
2778 | for (i=0; i < lim; ++i) |
2779 | imdct_step3_inner_r_loop(n >> (l+4), u, n2-1 - k0*i, -k0_2, A, 1 << (l+3)); |
2780 | } |
2781 | |
2782 | for (; l < ld-6; ++l) { |
2783 | int k0 = n >> (l+2), k1 = 1 << (l+3), k0_2 = k0>>1; |
2784 | int rlim = n >> (l+6), r; |
2785 | int lim = 1 << (l+1); |
2786 | int i_off; |
2787 | float *A0 = A; |
2788 | i_off = n2-1; |
2789 | for (r=rlim; r > 0; --r) { |
2790 | imdct_step3_inner_s_loop(lim, u, i_off, -k0_2, A0, k1, k0); |
2791 | A0 += k1*4; |
2792 | i_off -= 8; |
2793 | } |
2794 | } |
2795 | |
2796 | // iterations with count: |
2797 | // ld-6,-5,-4 all interleaved together |
2798 | // the big win comes from getting rid of needless flops |
2799 | // due to the constants on pass 5 & 4 being all 1 and 0; |
2800 | // combining them to be simultaneous to improve cache made little difference |
2801 | imdct_step3_inner_s_loop_ld654(n >> 5, u, n2-1, A, n); |
2802 | |
2803 | // output is u |
2804 | |
2805 | // step 4, 5, and 6 |
2806 | // cannot be in-place because of step 5 |
2807 | { |
2808 | uint16 *bitrev = f->bit_reverse[blocktype]; |
2809 | // weirdly, I'd have thought reading sequentially and writing |
2810 | // erratically would have been better than vice-versa, but in |
2811 | // fact that's not what my testing showed. (That is, with |
2812 | // j = bitreverse(i), do you read i and write j, or read j and write i.) |
2813 | |
2814 | float *d0 = &v[n4-4]; |
2815 | float *d1 = &v[n2-4]; |
2816 | while (d0 >= v) { |
2817 | int k4; |
2818 | |
2819 | k4 = bitrev[0]; |
2820 | d1[3] = u[k4+0]; |
2821 | d1[2] = u[k4+1]; |
2822 | d0[3] = u[k4+2]; |
2823 | d0[2] = u[k4+3]; |
2824 | |
2825 | k4 = bitrev[1]; |
2826 | d1[1] = u[k4+0]; |
2827 | d1[0] = u[k4+1]; |
2828 | d0[1] = u[k4+2]; |
2829 | d0[0] = u[k4+3]; |
2830 | |
2831 | d0 -= 4; |
2832 | d1 -= 4; |
2833 | bitrev += 2; |
2834 | } |
2835 | } |
2836 | // (paper output is u, now v) |
2837 | |
2838 | |
2839 | // data must be in buf2 |
2840 | assert(v == buf2)((v == buf2) ? (void)0 : _assert("v == buf2", "src/siege/internal/stb/stb_vorbis.c" , 2840)); |
2841 | |
2842 | // step 7 (paper output is v, now v) |
2843 | // this is now in place |
2844 | { |
2845 | float *C(2 | 4 | 1) = f->C(2 | 4 | 1)[blocktype]; |
2846 | float *d, *e; |
2847 | |
2848 | d = v; |
2849 | e = v + n2 - 4; |
2850 | |
2851 | while (d < e) { |
2852 | float a02,a11,b0,b1,b2,b3; |
2853 | |
2854 | a02 = d[0] - e[2]; |
2855 | a11 = d[1] + e[3]; |
2856 | |
2857 | b0 = C(2 | 4 | 1)[1]*a02 + C(2 | 4 | 1)[0]*a11; |
2858 | b1 = C(2 | 4 | 1)[1]*a11 - C(2 | 4 | 1)[0]*a02; |
2859 | |
2860 | b2 = d[0] + e[ 2]; |
2861 | b3 = d[1] - e[ 3]; |
2862 | |
2863 | d[0] = b2 + b0; |
2864 | d[1] = b3 + b1; |
2865 | e[2] = b2 - b0; |
2866 | e[3] = b1 - b3; |
2867 | |
2868 | a02 = d[2] - e[0]; |
2869 | a11 = d[3] + e[1]; |
2870 | |
2871 | b0 = C(2 | 4 | 1)[3]*a02 + C(2 | 4 | 1)[2]*a11; |
2872 | b1 = C(2 | 4 | 1)[3]*a11 - C(2 | 4 | 1)[2]*a02; |
2873 | |
2874 | b2 = d[2] + e[ 0]; |
2875 | b3 = d[3] - e[ 1]; |
2876 | |
2877 | d[2] = b2 + b0; |
2878 | d[3] = b3 + b1; |
2879 | e[0] = b2 - b0; |
2880 | e[1] = b1 - b3; |
2881 | |
2882 | C(2 | 4 | 1) += 4; |
2883 | d += 4; |
2884 | e -= 4; |
2885 | } |
2886 | } |
2887 | |
2888 | // data must be in buf2 |
2889 | |
2890 | |
2891 | // step 8+decode (paper output is X, now buffer) |
2892 | // this generates pairs of data a la 8 and pushes them directly through |
2893 | // the decode kernel (pushing rather than pulling) to avoid having |
2894 | // to make another pass later |
2895 | |
2896 | // this cannot POSSIBLY be in place, so we refer to the buffers directly |
2897 | |
2898 | { |
2899 | float *d0,*d1,*d2,*d3; |
2900 | |
2901 | float *B = f->B[blocktype] + n2 - 8; |
2902 | float *e = buf2 + n2 - 8; |
2903 | d0 = &buffer[0]; |
2904 | d1 = &buffer[n2-4]; |
2905 | d2 = &buffer[n2]; |
2906 | d3 = &buffer[n-4]; |
2907 | while (e >= v) { |
2908 | float p0,p1,p2,p3; |
2909 | |
2910 | p3 = e[6]*B[7] - e[7]*B[6]; |
2911 | p2 = -e[6]*B[6] - e[7]*B[7]; |
2912 | |
2913 | d0[0] = p3; |
2914 | d1[3] = - p3; |
2915 | d2[0] = p2; |
2916 | d3[3] = p2; |
2917 | |
2918 | p1 = e[4]*B[5] - e[5]*B[4]; |
2919 | p0 = -e[4]*B[4] - e[5]*B[5]; |
2920 | |
2921 | d0[1] = p1; |
2922 | d1[2] = - p1; |
2923 | d2[1] = p0; |
2924 | d3[2] = p0; |
2925 | |
2926 | p3 = e[2]*B[3] - e[3]*B[2]; |
2927 | p2 = -e[2]*B[2] - e[3]*B[3]; |
2928 | |
2929 | d0[2] = p3; |
2930 | d1[1] = - p3; |
2931 | d2[2] = p2; |
2932 | d3[1] = p2; |
2933 | |
2934 | p1 = e[0]*B[1] - e[1]*B[0]; |
2935 | p0 = -e[0]*B[0] - e[1]*B[1]; |
2936 | |
2937 | d0[3] = p1; |
2938 | d1[0] = - p1; |
2939 | d2[3] = p0; |
2940 | d3[0] = p0; |
2941 | |
2942 | B -= 8; |
2943 | e -= 8; |
2944 | d0 += 4; |
2945 | d2 += 4; |
2946 | d1 -= 4; |
2947 | d3 -= 4; |
2948 | } |
2949 | } |
2950 | |
2951 | temp_alloc_restore(f,save_point)((f)->temp_offset = (save_point)); |
2952 | } |
2953 | |
2954 | #if 0 |
2955 | // this is the original version of the above code, if you want to optimize it from scratch |
2956 | void inverse_mdct_naive(float *buffer, int n) |
2957 | { |
2958 | float s; |
2959 | float A[1 << 12], B[1 << 12], C(2 | 4 | 1)[1 << 11]; |
2960 | int i,k,k2,k4, n2 = n >> 1, n4 = n >> 2, n8 = n >> 3, l; |
2961 | int n3_4 = n - n4, ld; |
2962 | // how can they claim this only uses N words?! |
2963 | // oh, because they're only used sparsely, whoops |
2964 | float u[1 << 13], X[1 << 13], v[1 << 13], w[1 << 13]; |
2965 | // set up twiddle factors |
2966 | |
2967 | for (k=k2=0; k < n4; ++k,k2+=2) { |
2968 | A[k2 ] = (float) cos(4*k*M_PI3.14159265358979323846/n); |
2969 | A[k2+1] = (float) -sin(4*k*M_PI3.14159265358979323846/n); |
2970 | B[k2 ] = (float) cos((k2+1)*M_PI3.14159265358979323846/n/2); |
2971 | B[k2+1] = (float) sin((k2+1)*M_PI3.14159265358979323846/n/2); |
2972 | } |
2973 | for (k=k2=0; k < n8; ++k,k2+=2) { |
2974 | C(2 | 4 | 1)[k2 ] = (float) cos(2*(k2+1)*M_PI3.14159265358979323846/n); |
2975 | C(2 | 4 | 1)[k2+1] = (float) -sin(2*(k2+1)*M_PI3.14159265358979323846/n); |
2976 | } |
2977 | |
2978 | // IMDCT algorithm from "The use of multirate filter banks for coding of high quality digital audio" |
2979 | // Note there are bugs in that pseudocode, presumably due to them attempting |
2980 | // to rename the arrays nicely rather than representing the way their actual |
2981 | // implementation bounces buffers back and forth. As a result, even in the |
2982 | // "some formulars corrected" version, a direct implementation fails. These |
2983 | // are noted below as "paper bug". |
2984 | |
2985 | // copy and reflect spectral data |
2986 | for (k=0; k < n2; ++k) u[k] = buffer[k]; |
2987 | for ( ; k < n ; ++k) u[k] = -buffer[n - k - 1]; |
2988 | // kernel from paper |
2989 | // step 1 |
2990 | for (k=k2=k4=0; k < n4; k+=1, k2+=2, k4+=4) { |
2991 | v[n-k4-1] = (u[k4] - u[n-k4-1]) * A[k2] - (u[k4+2] - u[n-k4-3])*A[k2+1]; |
2992 | v[n-k4-3] = (u[k4] - u[n-k4-1]) * A[k2+1] + (u[k4+2] - u[n-k4-3])*A[k2]; |
2993 | } |
2994 | // step 2 |
2995 | for (k=k4=0; k < n8; k+=1, k4+=4) { |
2996 | w[n2+3+k4] = v[n2+3+k4] + v[k4+3]; |
2997 | w[n2+1+k4] = v[n2+1+k4] + v[k4+1]; |
2998 | w[k4+3] = (v[n2+3+k4] - v[k4+3])*A[n2-4-k4] - (v[n2+1+k4]-v[k4+1])*A[n2-3-k4]; |
2999 | w[k4+1] = (v[n2+1+k4] - v[k4+1])*A[n2-4-k4] + (v[n2+3+k4]-v[k4+3])*A[n2-3-k4]; |
3000 | } |
3001 | // step 3 |
3002 | ld = ilog(n) - 1; // ilog is off-by-one from normal definitions |
3003 | for (l=0; l < ld-3; ++l) { |
3004 | int k0 = n >> (l+2), k1 = 1 << (l+3); |
3005 | int rlim = n >> (l+4), r4, r; |
3006 | int s2lim = 1 << (l+2), s2; |
3007 | for (r=r4=0; r < rlim; r4+=4,++r) { |
3008 | for (s2=0; s2 < s2lim; s2+=2) { |
3009 | u[n-1-k0*s2-r4] = w[n-1-k0*s2-r4] + w[n-1-k0*(s2+1)-r4]; |
3010 | u[n-3-k0*s2-r4] = w[n-3-k0*s2-r4] + w[n-3-k0*(s2+1)-r4]; |
3011 | u[n-1-k0*(s2+1)-r4] = (w[n-1-k0*s2-r4] - w[n-1-k0*(s2+1)-r4]) * A[r*k1] |
3012 | - (w[n-3-k0*s2-r4] - w[n-3-k0*(s2+1)-r4]) * A[r*k1+1]; |
3013 | u[n-3-k0*(s2+1)-r4] = (w[n-3-k0*s2-r4] - w[n-3-k0*(s2+1)-r4]) * A[r*k1] |
3014 | + (w[n-1-k0*s2-r4] - w[n-1-k0*(s2+1)-r4]) * A[r*k1+1]; |
3015 | } |
3016 | } |
3017 | if (l+1 < ld-3) { |
3018 | // paper bug: ping-ponging of u&w here is omitted |
3019 | memcpy(w, u, sizeof(u)); |
3020 | } |
3021 | } |
3022 | |
3023 | // step 4 |
3024 | for (i=0; i < n8; ++i) { |
3025 | int j = bit_reverse(i) >> (32-ld+3); |
3026 | assert(j < n8)((j < n8) ? (void)0 : _assert("j < n8", "src/siege/internal/stb/stb_vorbis.c" , 3026)); |
3027 | if (i == j) { |
3028 | // paper bug: original code probably swapped in place; if copying, |
3029 | // need to directly copy in this case |
3030 | int i8 = i << 3; |
3031 | v[i8+1] = u[i8+1]; |
3032 | v[i8+3] = u[i8+3]; |
3033 | v[i8+5] = u[i8+5]; |
3034 | v[i8+7] = u[i8+7]; |
3035 | } else if (i < j) { |
3036 | int i8 = i << 3, j8 = j << 3; |
3037 | v[j8+1] = u[i8+1], v[i8+1] = u[j8 + 1]; |
3038 | v[j8+3] = u[i8+3], v[i8+3] = u[j8 + 3]; |
3039 | v[j8+5] = u[i8+5], v[i8+5] = u[j8 + 5]; |
3040 | v[j8+7] = u[i8+7], v[i8+7] = u[j8 + 7]; |
3041 | } |
3042 | } |
3043 | // step 5 |
3044 | for (k=0; k < n2; ++k) { |
3045 | w[k] = v[k*2+1]; |
3046 | } |
3047 | // step 6 |
3048 | for (k=k2=k4=0; k < n8; ++k, k2 += 2, k4 += 4) { |
3049 | u[n-1-k2] = w[k4]; |
3050 | u[n-2-k2] = w[k4+1]; |
3051 | u[n3_4 - 1 - k2] = w[k4+2]; |
3052 | u[n3_4 - 2 - k2] = w[k4+3]; |
3053 | } |
3054 | // step 7 |
3055 | for (k=k2=0; k < n8; ++k, k2 += 2) { |
3056 | v[n2 + k2 ] = ( u[n2 + k2] + u[n-2-k2] + C(2 | 4 | 1)[k2+1]*(u[n2+k2]-u[n-2-k2]) + C(2 | 4 | 1)[k2]*(u[n2+k2+1]+u[n-2-k2+1]))/2; |
3057 | v[n-2 - k2] = ( u[n2 + k2] + u[n-2-k2] - C(2 | 4 | 1)[k2+1]*(u[n2+k2]-u[n-2-k2]) - C(2 | 4 | 1)[k2]*(u[n2+k2+1]+u[n-2-k2+1]))/2; |
3058 | v[n2+1+ k2] = ( u[n2+1+k2] - u[n-1-k2] + C(2 | 4 | 1)[k2+1]*(u[n2+1+k2]+u[n-1-k2]) - C(2 | 4 | 1)[k2]*(u[n2+k2]-u[n-2-k2]))/2; |
3059 | v[n-1 - k2] = (-u[n2+1+k2] + u[n-1-k2] + C(2 | 4 | 1)[k2+1]*(u[n2+1+k2]+u[n-1-k2]) - C(2 | 4 | 1)[k2]*(u[n2+k2]-u[n-2-k2]))/2; |
3060 | } |
3061 | // step 8 |
3062 | for (k=k2=0; k < n4; ++k,k2 += 2) { |
3063 | X[k] = v[k2+n2]*B[k2 ] + v[k2+1+n2]*B[k2+1]; |
3064 | X[n2-1-k] = v[k2+n2]*B[k2+1] - v[k2+1+n2]*B[k2 ]; |
3065 | } |
3066 | |
3067 | // decode kernel to output |
3068 | // determined the following value experimentally |
3069 | // (by first figuring out what made inverse_mdct_slow work); then matching that here |
3070 | // (probably vorbis encoder premultiplies by n or n/2, to save it on the decoder?) |
3071 | s = 0.5; // theoretically would be n4 |
3072 | |
3073 | // [[[ note! the s value of 0.5 is compensated for by the B[] in the current code, |
3074 | // so it needs to use the "old" B values to behave correctly, or else |
3075 | // set s to 1.0 ]]] |
3076 | for (i=0; i < n4 ; ++i) buffer[i] = s * X[i+n4]; |
3077 | for ( ; i < n3_4; ++i) buffer[i] = -s * X[n3_4 - i - 1]; |
3078 | for ( ; i < n ; ++i) buffer[i] = -s * X[i - n3_4]; |
3079 | } |
3080 | #endif |
3081 | |
3082 | static float *get_window(vorb *f, int len) |
3083 | { |
3084 | len <<= 1; |
3085 | if (len == f->blocksize_0) return f->window[0]; |
3086 | if (len == f->blocksize_1) return f->window[1]; |
3087 | assert(0)((0) ? (void)0 : _assert("0", "src/siege/internal/stb/stb_vorbis.c" , 3087)); |
3088 | return NULL((void*)0); |
3089 | } |
3090 | |
3091 | #ifndef STB_VORBIS_NO_DEFER_FLOOR |
3092 | typedef int16 YTYPE; |
3093 | #else |
3094 | typedef int YTYPE; |
3095 | #endif |
3096 | static int do_floor(vorb *f, Mapping *map, int i, int n, float *target, YTYPE *finalY, uint8 *step2_flag) |
3097 | { |
3098 | int n2 = n >> 1; |
3099 | int s = map->chan[i].mux, floor; |
3100 | floor = map->submap_floor[s]; |
3101 | if (f->floor_types[floor] == 0) { |
3102 | return error(f, VORBIS_invalid_stream); |
3103 | } else { |
3104 | Floor1 *g = &f->floor_config[floor].floor1; |
3105 | int j,q; |
3106 | int lx = 0, ly = finalY[0] * g->floor1_multiplier; |
3107 | for (q=1; q < g->values; ++q) { |
3108 | j = g->sorted_order[q]; |
3109 | #ifndef STB_VORBIS_NO_DEFER_FLOOR |
3110 | if (finalY[j] >= 0) |
3111 | #else |
3112 | if (step2_flag[j]) |
3113 | #endif |
3114 | { |
3115 | int hy = finalY[j] * g->floor1_multiplier; |
3116 | int hx = g->Xlist[j]; |
3117 | draw_line(target, lx,ly, hx,hy, n2); |
3118 | lx = hx, ly = hy; |
3119 | } |
3120 | } |
3121 | if (lx < n2) |
3122 | // optimization of: draw_line(target, lx,ly, n,ly, n2); |
3123 | for (j=lx; j < n2; ++j) |
3124 | LINE_OP(target[j], inverse_db_table[ly])target[j] *= inverse_db_table[ly]; |
3125 | } |
3126 | return TRUE1; |
3127 | } |
3128 | |
3129 | static int vorbis_decode_initial(vorb *f, int *p_left_start, int *p_left_end, int *p_right_start, int *p_right_end, int *mode) |
3130 | { |
3131 | Mode *m; |
3132 | int i, n, prev, next, window_center; |
3133 | f->channel_buffer_start = f->channel_buffer_end = 0; |
3134 | |
3135 | retry: |
3136 | if (f->eof) return FALSE0; |
3137 | if (!maybe_start_packet(f)) |
3138 | return FALSE0; |
3139 | // check packet type |
3140 | if (get_bits(f,1) != 0) { |
3141 | if (IS_PUSH_MODE(f)((f)->push_mode)) |
3142 | return error(f,VORBIS_bad_packet_type); |
3143 | while (EOP(-1) != get8_packet(f)); |
3144 | goto retry; |
3145 | } |
3146 | |
3147 | if (f->alloc.alloc_buffer) |
3148 | assert(f->alloc.alloc_buffer_length_in_bytes == f->temp_offset)((f->alloc.alloc_buffer_length_in_bytes == f->temp_offset ) ? (void)0 : _assert("f->alloc.alloc_buffer_length_in_bytes == f->temp_offset" , "src/siege/internal/stb/stb_vorbis.c", 3148)); |
3149 | |
3150 | i = get_bits(f, ilog(f->mode_count-1)); |
3151 | if (i == EOP(-1)) return FALSE0; |
3152 | if (i >= f->mode_count) return FALSE0; |
3153 | *mode = i; |
3154 | m = f->mode_config + i; |
3155 | if (m->blockflag) { |
3156 | n = f->blocksize_1; |
3157 | prev = get_bits(f,1); |
3158 | next = get_bits(f,1); |
3159 | } else { |
3160 | prev = next = 0; |
3161 | n = f->blocksize_0; |
3162 | } |
3163 | |
3164 | // WINDOWING |
3165 | |
3166 | window_center = n >> 1; |
3167 | if (m->blockflag && !prev) { |
3168 | *p_left_start = (n - f->blocksize_0) >> 2; |
3169 | *p_left_end = (n + f->blocksize_0) >> 2; |
3170 | } else { |
3171 | *p_left_start = 0; |
3172 | *p_left_end = window_center; |
3173 | } |
3174 | if (m->blockflag && !next) { |
3175 | *p_right_start = (n*3 - f->blocksize_0) >> 2; |
3176 | *p_right_end = (n*3 + f->blocksize_0) >> 2; |
3177 | } else { |
3178 | *p_right_start = window_center; |
3179 | *p_right_end = n; |
3180 | } |
3181 | return TRUE1; |
3182 | } |
3183 | |
3184 | static int vorbis_decode_packet_rest(vorb *f, int *len, Mode *m, int left_start, int left_end, int right_start, int right_end, int *p_left) |
3185 | { |
3186 | Mapping *map; |
3187 | int i,j,k,n,n2; |
3188 | int zero_channel[256]; |
3189 | int really_zero_channel[256]; |
3190 | int window_center; |
3191 | |
3192 | // WINDOWING |
3193 | |
3194 | n = f->blocksize[m->blockflag]; |
3195 | window_center = n >> 1; |
3196 | (void)window_center; |
3197 | |
3198 | map = &f->mapping[m->mapping]; |
3199 | |
3200 | // FLOORS |
3201 | n2 = n >> 1; |
3202 | |
3203 | stb_prof(1)(void)0; |
3204 | for (i=0; i < f->channels; ++i) { |
3205 | int s = map->chan[i].mux, floor; |
3206 | zero_channel[i] = FALSE0; |
3207 | floor = map->submap_floor[s]; |
3208 | if (f->floor_types[floor] == 0) { |
3209 | return error(f, VORBIS_invalid_stream); |
3210 | } else { |
3211 | Floor1 *g = &f->floor_config[floor].floor1; |
3212 | if (get_bits(f, 1)) { |
3213 | short *finalY; |
3214 | uint8 step2_flag[256]; |
3215 | static int range_list[4] = { 256, 128, 86, 64 }; |
3216 | int range = range_list[g->floor1_multiplier-1]; |
3217 | int offset = 2; |
3218 | finalY = f->finalY[i]; |
3219 | finalY[0] = get_bits(f, ilog(range)-1); |
3220 | finalY[1] = get_bits(f, ilog(range)-1); |
3221 | for (j=0; j < g->partitions; ++j) { |
3222 | int pclass = g->partition_class_list[j]; |
3223 | int cdim = g->class_dimensions[pclass]; |
3224 | int cbits = g->class_subclasses[pclass]; |
3225 | int csub = (1 << cbits)-1; |
3226 | int cval = 0; |
3227 | if (cbits) { |
3228 | Codebook *c = f->codebooks + g->class_masterbooks[pclass]; |
3229 | DECODE(cval,f,c)if (f->valid_bits < 10) prep_huffman(f); cval = f->acc & ((1 << 10) - 1); cval = c->fast_huffman[cval] ; if (cval >= 0) { int n = c->codeword_lengths[cval]; f ->acc >>= n; f->valid_bits -= n; if (f->valid_bits < 0) { f->valid_bits = 0; cval = -1; } } else { cval = codebook_decode_scalar_raw(f,c); } if (c->sparse) cval = c ->sorted_values[cval];; |
3230 | } |
3231 | for (k=0; k < cdim; ++k) { |
3232 | int book = g->subclass_books[pclass][cval & csub]; |
3233 | cval = cval >> cbits; |
3234 | if (book >= 0) { |
3235 | int temp; |
3236 | Codebook *c = f->codebooks + book; |
3237 | DECODE(temp,f,c)if (f->valid_bits < 10) prep_huffman(f); temp = f->acc & ((1 << 10) - 1); temp = c->fast_huffman[temp] ; if (temp >= 0) { int n = c->codeword_lengths[temp]; f ->acc >>= n; f->valid_bits -= n; if (f->valid_bits < 0) { f->valid_bits = 0; temp = -1; } } else { temp = codebook_decode_scalar_raw(f,c); } if (c->sparse) temp = c ->sorted_values[temp];; |
3238 | finalY[offset++] = temp; |
3239 | } else |
3240 | finalY[offset++] = 0; |
3241 | } |
3242 | } |
3243 | if (f->valid_bits == INVALID_BITS(-1)) goto error; // behavior according to spec |
3244 | step2_flag[0] = step2_flag[1] = 1; |
3245 | for (j=2; j < g->values; ++j) { |
3246 | int low, high, pred, highroom, lowroom, room, val; |
3247 | low = g->neighbors[j][0]; |
3248 | high = g->neighbors[j][1]; |
3249 | //neighbors(g->Xlist, j, &low, &high); |
3250 | pred = predict_point(g->Xlist[j], g->Xlist[low], g->Xlist[high], finalY[low], finalY[high]); |
3251 | val = finalY[j]; |
3252 | highroom = range - pred; |
3253 | lowroom = pred; |
3254 | if (highroom < lowroom) |
3255 | room = highroom * 2; |
3256 | else |
3257 | room = lowroom * 2; |
3258 | if (val) { |
3259 | step2_flag[low] = step2_flag[high] = 1; |
3260 | step2_flag[j] = 1; |
3261 | if (val >= room) |
3262 | if (highroom > lowroom) |
3263 | finalY[j] = val - lowroom + pred; |
3264 | else |
3265 | finalY[j] = pred - val + highroom - 1; |
3266 | else |
3267 | if (val & 1) |
3268 | finalY[j] = pred - ((val+1)>>1); |
3269 | else |
3270 | finalY[j] = pred + (val>>1); |
3271 | } else { |
3272 | step2_flag[j] = 0; |
3273 | finalY[j] = pred; |
3274 | } |
3275 | } |
3276 | |
3277 | #ifdef STB_VORBIS_NO_DEFER_FLOOR |
3278 | do_floor(f, map, i, n, f->floor_buffers[i], finalY, step2_flag); |
3279 | #else |
3280 | // defer final floor computation until _after_ residue |
3281 | for (j=0; j < g->values; ++j) { |
3282 | if (!step2_flag[j]) |
3283 | finalY[j] = -1; |
3284 | } |
3285 | #endif |
3286 | } else { |
3287 | error: |
3288 | zero_channel[i] = TRUE1; |
3289 | } |
3290 | // So we just defer everything else to later |
3291 | |
3292 | // at this point we've decoded the floor into buffer |
3293 | } |
3294 | } |
3295 | stb_prof(0)(void)0; |
3296 | // at this point we've decoded all floors |
3297 | |
3298 | if (f->alloc.alloc_buffer) |
3299 | assert(f->alloc.alloc_buffer_length_in_bytes == f->temp_offset)((f->alloc.alloc_buffer_length_in_bytes == f->temp_offset ) ? (void)0 : _assert("f->alloc.alloc_buffer_length_in_bytes == f->temp_offset" , "src/siege/internal/stb/stb_vorbis.c", 3299)); |
3300 | |
3301 | // re-enable coupled channels if necessary |
3302 | memcpy(really_zero_channel, zero_channel, sizeof(really_zero_channel[0]) * f->channels); |
3303 | for (i=0; i < map->coupling_steps; ++i) |
3304 | if (!zero_channel[map->chan[i].magnitude] || !zero_channel[map->chan[i].angle]) { |
3305 | zero_channel[map->chan[i].magnitude] = zero_channel[map->chan[i].angle] = FALSE0; |
3306 | } |
3307 | |
3308 | // RESIDUE DECODE |
3309 | for (i=0; i < map->submaps; ++i) { |
3310 | float *residue_buffers[STB_VORBIS_MAX_CHANNELS16]; |
3311 | int r,t; |
3312 | uint8 do_not_decode[256]; |
3313 | int ch = 0; |
3314 | for (j=0; j < f->channels; ++j) { |
3315 | if (map->chan[j].mux == i) { |
3316 | if (zero_channel[j]) { |
3317 | do_not_decode[ch] = TRUE1; |
3318 | residue_buffers[ch] = NULL((void*)0); |
3319 | } else { |
3320 | do_not_decode[ch] = FALSE0; |
3321 | residue_buffers[ch] = f->channel_buffers[j]; |
3322 | } |
3323 | ++ch; |
3324 | } |
3325 | } |
3326 | r = map->submap_residue[i]; |
3327 | t = f->residue_types[r]; |
3328 | (void)t; |
3329 | decode_residue(f, residue_buffers, ch, n2, r, do_not_decode); |
3330 | } |
3331 | |
3332 | if (f->alloc.alloc_buffer) |
3333 | assert(f->alloc.alloc_buffer_length_in_bytes == f->temp_offset)((f->alloc.alloc_buffer_length_in_bytes == f->temp_offset ) ? (void)0 : _assert("f->alloc.alloc_buffer_length_in_bytes == f->temp_offset" , "src/siege/internal/stb/stb_vorbis.c", 3333)); |
3334 | |
3335 | // INVERSE COUPLING |
3336 | stb_prof(14)(void)0; |
3337 | for (i = map->coupling_steps-1; i >= 0; --i) { |
3338 | int n2 = n >> 1; |
3339 | float *m = f->channel_buffers[map->chan[i].magnitude]; |
3340 | float *a = f->channel_buffers[map->chan[i].angle ]; |
3341 | for (j=0; j < n2; ++j) { |
3342 | float a2,m2; |
3343 | if (m[j] > 0) |
3344 | if (a[j] > 0) |
3345 | m2 = m[j], a2 = m[j] - a[j]; |
3346 | else |
3347 | a2 = m[j], m2 = m[j] + a[j]; |
3348 | else |
3349 | if (a[j] > 0) |
3350 | m2 = m[j], a2 = m[j] + a[j]; |
3351 | else |
3352 | a2 = m[j], m2 = m[j] - a[j]; |
3353 | m[j] = m2; |
3354 | a[j] = a2; |
3355 | } |
3356 | } |
3357 | |
3358 | // finish decoding the floors |
3359 | #ifndef STB_VORBIS_NO_DEFER_FLOOR |
3360 | stb_prof(15)(void)0; |
3361 | for (i=0; i < f->channels; ++i) { |
3362 | if (really_zero_channel[i]) { |
3363 | memset(f->channel_buffers[i], 0, sizeof(*f->channel_buffers[i]) * n2); |
3364 | } else { |
3365 | do_floor(f, map, i, n, f->channel_buffers[i], f->finalY[i], NULL((void*)0)); |
3366 | } |
3367 | } |
3368 | #else |
3369 | for (i=0; i < f->channels; ++i) { |
3370 | if (really_zero_channel[i]) { |
3371 | memset(f->channel_buffers[i], 0, sizeof(*f->channel_buffers[i]) * n2); |
3372 | } else { |
3373 | for (j=0; j < n2; ++j) |
3374 | f->channel_buffers[i][j] *= f->floor_buffers[i][j]; |
3375 | } |
3376 | } |
3377 | #endif |
3378 | |
3379 | // INVERSE MDCT |
3380 | stb_prof(16)(void)0; |
3381 | for (i=0; i < f->channels; ++i) |
3382 | inverse_mdct(f->channel_buffers[i], n, f, m->blockflag); |
3383 | stb_prof(0)(void)0; |
3384 | |
3385 | // this shouldn't be necessary, unless we exited on an error |
3386 | // and want to flush to get to the next packet |
3387 | flush_packet(f); |
3388 | |
3389 | if (f->first_decode) { |
3390 | // assume we start so first non-discarded sample is sample 0 |
3391 | // this isn't to spec, but spec would require us to read ahead |
3392 | // and decode the size of all current frames--could be done, |
3393 | // but presumably it's not a commonly used feature |
3394 | f->current_loc = -n2; // start of first frame is positioned for discard |
3395 | // we might have to discard samples "from" the next frame too, |
3396 | // if we're lapping a large block then a small at the start? |
3397 | f->discard_samples_deferred = n - right_end; |
3398 | f->current_loc_valid = TRUE1; |
3399 | f->first_decode = FALSE0; |
3400 | } else if (f->discard_samples_deferred) { |
3401 | left_start += f->discard_samples_deferred; |
3402 | *p_left = left_start; |
3403 | f->discard_samples_deferred = 0; |
3404 | } else if (f->previous_length == 0 && f->current_loc_valid) { |
3405 | // we're recovering from a seek... that means we're going to discard |
3406 | // the samples from this packet even though we know our position from |
3407 | // the last page header, so we need to update the position based on |
3408 | // the discarded samples here |
3409 | // but wait, the code below is going to add this in itself even |
3410 | // on a discard, so we don't need to do it here... |
3411 | } |
3412 | |
3413 | // check if we have ogg information about the sample # for this packet |
3414 | if (f->last_seg_which == f->end_seg_with_known_loc) { |
3415 | // if we have a valid current loc, and this is final: |
3416 | if (f->current_loc_valid && (f->page_flag & PAGEFLAG_last_page4)) { |
3417 | uint32 current_end = f->known_loc_for_packet - (n-right_end); |
3418 | // then let's infer the size of the (probably) short final frame |
3419 | if (current_end < f->current_loc + right_end) { |
3420 | if (current_end < f->current_loc) { |
3421 | // negative truncation, that's impossible! |
3422 | *len = 0; |
3423 | } else { |
3424 | *len = current_end - f->current_loc; |
3425 | } |
3426 | *len += left_start; |
3427 | f->current_loc += *len; |
3428 | return TRUE1; |
3429 | } |
3430 | } |
3431 | // otherwise, just set our sample loc |
3432 | // guess that the ogg granule pos refers to the _middle_ of the |
3433 | // last frame? |
3434 | // set f->current_loc to the position of left_start |
3435 | f->current_loc = f->known_loc_for_packet - (n2-left_start); |
3436 | f->current_loc_valid = TRUE1; |
3437 | } |
3438 | if (f->current_loc_valid) |
3439 | f->current_loc += (right_start - left_start); |
3440 | |
3441 | if (f->alloc.alloc_buffer) |
3442 | assert(f->alloc.alloc_buffer_length_in_bytes == f->temp_offset)((f->alloc.alloc_buffer_length_in_bytes == f->temp_offset ) ? (void)0 : _assert("f->alloc.alloc_buffer_length_in_bytes == f->temp_offset" , "src/siege/internal/stb/stb_vorbis.c", 3442)); |
3443 | *len = right_end; // ignore samples after the window goes to 0 |
3444 | return TRUE1; |
3445 | } |
3446 | |
3447 | static int vorbis_decode_packet(vorb *f, int *len, int *p_left, int *p_right) |
3448 | { |
3449 | int mode, left_end, right_end; |
3450 | if (!vorbis_decode_initial(f, p_left, &left_end, p_right, &right_end, &mode)) return 0; |
3451 | return vorbis_decode_packet_rest(f, len, f->mode_config + mode, *p_left, left_end, *p_right, right_end, p_left); |
3452 | } |
3453 | |
3454 | static int vorbis_finish_frame(stb_vorbis *f, int len, int left, int right) |
3455 | { |
3456 | int prev,i,j; |
3457 | // we use right&left (the start of the right- and left-window sin()-regions) |
3458 | // to determine how much to return, rather than inferring from the rules |
3459 | // (same result, clearer code); 'left' indicates where our sin() window |
3460 | // starts, therefore where the previous window's right edge starts, and |
3461 | // therefore where to start mixing from the previous buffer. 'right' |
3462 | // indicates where our sin() ending-window starts, therefore that's where |
3463 | // we start saving, and where our returned-data ends. |
3464 | |
3465 | // mixin from previous window |
3466 | if (f->previous_length) { |
3467 | int i,j, n = f->previous_length; |
3468 | float *w = get_window(f, n); |
3469 | for (i=0; i < f->channels; ++i) { |
3470 | for (j=0; j < n; ++j) |
3471 | f->channel_buffers[i][left+j] = |
3472 | f->channel_buffers[i][left+j]*w[ j] + |
3473 | f->previous_window[i][ j]*w[n-1-j]; |
3474 | } |
3475 | } |
3476 | |
3477 | prev = f->previous_length; |
3478 | |
3479 | // last half of this data becomes previous window |
3480 | f->previous_length = len - right; |
3481 | |
3482 | // @OPTIMIZE: could avoid this copy by double-buffering the |
3483 | // output (flipping previous_window with channel_buffers), but |
3484 | // then previous_window would have to be 2x as large, and |
3485 | // channel_buffers couldn't be temp mem (although they're NOT |
3486 | // currently temp mem, they could be (unless we want to level |
3487 | // performance by spreading out the computation)) |
3488 | for (i=0; i < f->channels; ++i) |
3489 | for (j=0; right+j < len; ++j) |
3490 | f->previous_window[i][j] = f->channel_buffers[i][right+j]; |
3491 | |
3492 | if (!prev) |
3493 | // there was no previous packet, so this data isn't valid... |
3494 | // this isn't entirely true, only the would-have-overlapped data |
3495 | // isn't valid, but this seems to be what the spec requires |
3496 | return 0; |
3497 | |
3498 | // truncate a short frame |
3499 | if (len < right) right = len; |
3500 | |
3501 | f->samples_output += right-left; |
3502 | |
3503 | return right - left; |
3504 | } |
3505 | |
3506 | static void vorbis_pump_first_frame(stb_vorbis *f) |
3507 | { |
3508 | int len, right, left; |
3509 | if (vorbis_decode_packet(f, &len, &left, &right)) |
3510 | vorbis_finish_frame(f, len, left, right); |
3511 | } |
3512 | |
3513 | #ifndef STB_VORBIS_NO_PUSHDATA_API |
3514 | static int is_whole_packet_present(stb_vorbis *f, int end_page) |
3515 | { |
3516 | // make sure that we have the packet available before continuing... |
3517 | // this requires a full ogg parse, but we know we can fetch from f->stream |
3518 | |
3519 | // instead of coding this out explicitly, we could save the current read state, |
3520 | // read the next packet with get8() until end-of-packet, check f->eof, then |
3521 | // reset the state? but that would be slower, esp. since we'd have over 256 bytes |
3522 | // of state to restore (primarily the page segment table) |
3523 | |
3524 | int s = f->next_seg, first = TRUE1; |
3525 | uint8 *p = f->stream; |
3526 | |
3527 | if (s != -1) { // if we're not starting the packet with a 'continue on next page' flag |
3528 | for (; s < f->segment_count; ++s) { |
3529 | p += f->segments[s]; |
3530 | if (f->segments[s] < 255) // stop at first short segment |
3531 | break; |
3532 | } |
3533 | // either this continues, or it ends it... |
3534 | if (end_page) |
3535 | if (s < f->segment_count-1) return error(f, VORBIS_invalid_stream); |
3536 | if (s == f->segment_count) |
3537 | s = -1; // set 'crosses page' flag |
3538 | if (p > f->stream_end) return error(f, VORBIS_need_more_data); |
3539 | first = FALSE0; |
3540 | } |
3541 | for (; s == -1;) { |
3542 | uint8 *q; |
3543 | int n; |
3544 | |
3545 | // check that we have the page header ready |
3546 | if (p + 26 >= f->stream_end) return error(f, VORBIS_need_more_data); |
3547 | // validate the page |
3548 | if (memcmp(p, ogg_page_header, 4)) return error(f, VORBIS_invalid_stream); |
3549 | if (p[4] != 0) return error(f, VORBIS_invalid_stream); |
3550 | if (first) { // the first segment must NOT have 'continued_packet', later ones MUST |
3551 | if (f->previous_length) |
3552 | if ((p[5] & PAGEFLAG_continued_packet1)) return error(f, VORBIS_invalid_stream); |
3553 | // if no previous length, we're resynching, so we can come in on a continued-packet, |
3554 | // which we'll just drop |
3555 | } else { |
3556 | if (!(p[5] & PAGEFLAG_continued_packet1)) return error(f, VORBIS_invalid_stream); |
3557 | } |
3558 | n = p[26]; // segment counts |
3559 | q = p+27; // q points to segment table |
3560 | p = q + n; // advance past header |
3561 | // make sure we've read the segment table |
3562 | if (p > f->stream_end) return error(f, VORBIS_need_more_data); |
3563 | for (s=0; s < n; ++s) { |
3564 | p += q[s]; |
3565 | if (q[s] < 255) |
3566 | break; |
3567 | } |
3568 | if (end_page) |
3569 | if (s < n-1) return error(f, VORBIS_invalid_stream); |
3570 | if (s == f->segment_count) |
3571 | s = -1; // set 'crosses page' flag |
3572 | if (p > f->stream_end) return error(f, VORBIS_need_more_data); |
3573 | first = FALSE0; |
3574 | } |
3575 | return TRUE1; |
3576 | } |
3577 | #endif // !STB_VORBIS_NO_PUSHDATA_API |
3578 | |
3579 | static int start_decoder(vorb *f) |
3580 | { |
3581 | uint8 header[6], x,y; |
3582 | int len,i,j,k, max_submaps = 0; |
3583 | int longest_floorlist=0; |
3584 | |
3585 | // first page, first packet |
3586 | |
3587 | if (!start_page(f)) return FALSE0; |
3588 | // validate page flag |
3589 | if (!(f->page_flag & PAGEFLAG_first_page2)) return error(f, VORBIS_invalid_first_page); |
3590 | if (f->page_flag & PAGEFLAG_last_page4) return error(f, VORBIS_invalid_first_page); |
3591 | if (f->page_flag & PAGEFLAG_continued_packet1) return error(f, VORBIS_invalid_first_page); |
3592 | // check for expected packet length |
3593 | if (f->segment_count != 1) return error(f, VORBIS_invalid_first_page); |
3594 | if (f->segments[0] != 30) return error(f, VORBIS_invalid_first_page); |
3595 | // read packet |
3596 | // check packet header |
3597 | if (get8(f) != VORBIS_packet_id) return error(f, VORBIS_invalid_first_page); |
3598 | if (!getn(f, header, 6)) return error(f, VORBIS_unexpected_eof); |
3599 | if (!vorbis_validate(header)) return error(f, VORBIS_invalid_first_page); |
3600 | // vorbis_version |
3601 | if (get32(f) != 0) return error(f, VORBIS_invalid_first_page); |
3602 | f->channels = get8(f); if (!f->channels) return error(f, VORBIS_invalid_first_page); |
3603 | if (f->channels > STB_VORBIS_MAX_CHANNELS16) return error(f, VORBIS_too_many_channels); |
3604 | f->sample_rate = get32(f); if (!f->sample_rate) return error(f, VORBIS_invalid_first_page); |
3605 | get32(f); // bitrate_maximum |
3606 | get32(f); // bitrate_nominal |
3607 | get32(f); // bitrate_minimum |
3608 | x = get8(f); |
3609 | { int log0,log1; |
3610 | log0 = x & 15; |
3611 | log1 = x >> 4; |
3612 | f->blocksize_0 = 1 << log0; |
3613 | f->blocksize_1 = 1 << log1; |
3614 | if (log0 < 6 || log0 > 13) return error(f, VORBIS_invalid_setup); |
3615 | if (log1 < 6 || log1 > 13) return error(f, VORBIS_invalid_setup); |
3616 | if (log0 > log1) return error(f, VORBIS_invalid_setup); |
3617 | } |
3618 | |
3619 | // framing_flag |
3620 | x = get8(f); |
3621 | if (!(x & 1)) return error(f, VORBIS_invalid_first_page); |
3622 | |
3623 | // second packet! |
3624 | if (!start_page(f)) return FALSE0; |
3625 | |
3626 | if (!start_packet(f)) return FALSE0; |
3627 | do { |
3628 | len = next_segment(f); |
3629 | skip(f, len); |
3630 | f->bytes_in_seg = 0; |
3631 | } while (len); |
3632 | |
3633 | // third packet! |
3634 | if (!start_packet(f)) return FALSE0; |
3635 | |
3636 | #ifndef STB_VORBIS_NO_PUSHDATA_API |
3637 | if (IS_PUSH_MODE(f)((f)->push_mode)) { |
3638 | if (!is_whole_packet_present(f, TRUE1)) { |
3639 | // convert error in ogg header to write type |
3640 | if (f->error == VORBIS_invalid_stream) |
3641 | f->error = VORBIS_invalid_setup; |
3642 | return FALSE0; |
3643 | } |
3644 | } |
3645 | #endif |
3646 | |
3647 | crc32_init(); // always init it, to avoid multithread race conditions |
3648 | |
3649 | if (get8_packet(f) != VORBIS_packet_setup) return error(f, VORBIS_invalid_setup); |
3650 | for (i=0; i < 6; ++i) header[i] = get8_packet(f); |
3651 | if (!vorbis_validate(header)) return error(f, VORBIS_invalid_setup); |
3652 | |
3653 | // codebooks |
3654 | |
3655 | f->codebook_count = get_bits(f,8) + 1; |
3656 | f->codebooks = (Codebook *) setup_malloc(f, sizeof(*f->codebooks) * f->codebook_count); |
3657 | if (f->codebooks == NULL((void*)0)) return error(f, VORBIS_outofmem); |
3658 | memset(f->codebooks, 0, sizeof(*f->codebooks) * f->codebook_count); |
3659 | for (i=0; i < f->codebook_count; ++i) { |
3660 | uint32 *values; |
3661 | int ordered, sorted_count; |
3662 | int total=0; |
3663 | uint8 *lengths; |
3664 | Codebook *c = f->codebooks+i; |
3665 | x = get_bits(f, 8); if (x != 0x42) return error(f, VORBIS_invalid_setup); |
3666 | x = get_bits(f, 8); if (x != 0x43) return error(f, VORBIS_invalid_setup); |
3667 | x = get_bits(f, 8); if (x != 0x56) return error(f, VORBIS_invalid_setup); |
3668 | x = get_bits(f, 8); |
3669 | c->dimensions = (get_bits(f, 8)<<8) + x; |
3670 | x = get_bits(f, 8); |
3671 | y = get_bits(f, 8); |
3672 | c->entries = (get_bits(f, 8)<<16) + (y<<8) + x; |
3673 | ordered = get_bits(f,1); |
3674 | c->sparse = ordered ? 0 : get_bits(f,1); |
3675 | |
3676 | if (c->sparse) |
3677 | lengths = (uint8 *) setup_temp_malloc(f, c->entries); |
3678 | else |
3679 | lengths = c->codeword_lengths = (uint8 *) setup_malloc(f, c->entries); |
3680 | |
3681 | if (!lengths) return error(f, VORBIS_outofmem); |
3682 | |
3683 | if (ordered) { |
3684 | int current_entry = 0; |
3685 | int current_length = get_bits(f,5) + 1; |
3686 | while (current_entry < c->entries) { |
3687 | int limit = c->entries - current_entry; |
3688 | int n = get_bits(f, ilog(limit)); |
3689 | if (current_entry + n > (int) c->entries) { return error(f, VORBIS_invalid_setup); } |
3690 | memset(lengths + current_entry, current_length, n); |
3691 | current_entry += n; |
3692 | ++current_length; |
3693 | } |
3694 | } else { |
3695 | for (j=0; j < c->entries; ++j) { |
3696 | int present = c->sparse ? get_bits(f,1) : 1; |
3697 | if (present) { |
3698 | lengths[j] = get_bits(f, 5) + 1; |
3699 | ++total; |
3700 | } else { |
3701 | lengths[j] = NO_CODE255; |
3702 | } |
3703 | } |
3704 | } |
3705 | |
3706 | if (c->sparse && total >= c->entries >> 2) { |
3707 | // convert sparse items to non-sparse! |
3708 | if (c->entries > (int) f->setup_temp_memory_required) |
3709 | f->setup_temp_memory_required = c->entries; |
3710 | |
3711 | c->codeword_lengths = (uint8 *) setup_malloc(f, c->entries); |
3712 | memcpy(c->codeword_lengths, lengths, c->entries); |
3713 | setup_temp_free(f, lengths, c->entries); // note this is only safe if there have been no intervening temp mallocs! |
3714 | lengths = c->codeword_lengths; |
3715 | c->sparse = 0; |
3716 | } |
3717 | |
3718 | // compute the size of the sorted tables |
3719 | if (c->sparse) { |
3720 | sorted_count = total; |
3721 | //assert(total != 0); |
3722 | } else { |
3723 | sorted_count = 0; |
3724 | #ifndef STB_VORBIS_NO_HUFFMAN_BINARY_SEARCH |
3725 | for (j=0; j < c->entries; ++j) |
3726 | if (lengths[j] > STB_VORBIS_FAST_HUFFMAN_LENGTH10 && lengths[j] != NO_CODE255) |
3727 | ++sorted_count; |
3728 | #endif |
3729 | } |
3730 | |
3731 | c->sorted_entries = sorted_count; |
3732 | values = NULL((void*)0); |
3733 | |
3734 | if (!c->sparse) { |
3735 | c->codewords = (uint32 *) setup_malloc(f, sizeof(c->codewords[0]) * c->entries); |
3736 | if (!c->codewords) return error(f, VORBIS_outofmem); |
3737 | } else { |
3738 | unsigned int size; |
3739 | if (c->sorted_entries) { |
3740 | c->codeword_lengths = (uint8 *) setup_malloc(f, c->sorted_entries); |
3741 | if (!c->codeword_lengths) return error(f, VORBIS_outofmem); |
3742 | c->codewords = (uint32 *) setup_temp_malloc(f, sizeof(*c->codewords) * c->sorted_entries); |
3743 | if (!c->codewords) return error(f, VORBIS_outofmem); |
3744 | values = (uint32 *) setup_temp_malloc(f, sizeof(*values) * c->sorted_entries); |
3745 | if (!values) return error(f, VORBIS_outofmem); |
3746 | } |
3747 | size = c->entries + (sizeof(*c->codewords) + sizeof(*values)) * c->sorted_entries; |
3748 | if (size > f->setup_temp_memory_required) |
3749 | f->setup_temp_memory_required = size; |
3750 | } |
3751 | |
3752 | if (!compute_codewords(c, lengths, c->entries, values)) { |
3753 | if (c->sparse) setup_temp_free(f, values, 0); |
3754 | return error(f, VORBIS_invalid_setup); |
3755 | } |
3756 | |
3757 | if (c->sorted_entries) { |
3758 | // allocate an extra slot for sentinels |
3759 | c->sorted_codewords = (uint32 *) setup_malloc(f, sizeof(*c->sorted_codewords) * (c->sorted_entries+1)); |
3760 | // allocate an extra slot at the front so that c->sorted_values[-1] is defined |
3761 | // so that we can catch that case without an extra if |
3762 | c->sorted_values = ( int *) setup_malloc(f, sizeof(*c->sorted_values ) * (c->sorted_entries+1)); |
3763 | if (c->sorted_values) { ++c->sorted_values; c->sorted_values[-1] = -1; } |
3764 | compute_sorted_huffman(c, lengths, values); |
3765 | } |
3766 | |
3767 | if (c->sparse) { |
3768 | setup_temp_free(f, values, sizeof(*values)*c->sorted_entries); |
3769 | setup_temp_free(f, c->codewords, sizeof(*c->codewords)*c->sorted_entries); |
3770 | setup_temp_free(f, lengths, c->entries); |
3771 | c->codewords = NULL((void*)0); |
3772 | } |
3773 | |
3774 | compute_accelerated_huffman(c); |
3775 | |
3776 | c->lookup_type = get_bits(f, 4); |
3777 | if (c->lookup_type > 2) return error(f, VORBIS_invalid_setup); |
3778 | if (c->lookup_type > 0) { |
3779 | uint16 *mults; |
3780 | c->minimum_value = float32_unpack(get_bits(f, 32)); |
3781 | c->delta_value = float32_unpack(get_bits(f, 32)); |
3782 | c->value_bits = get_bits(f, 4)+1; |
3783 | c->sequence_p = get_bits(f,1); |
3784 | if (c->lookup_type == 1) { |
3785 | c->lookup_values = lookup1_values(c->entries, c->dimensions); |
3786 | } else { |
3787 | c->lookup_values = c->entries * c->dimensions; |
3788 | } |
3789 | mults = (uint16 *) setup_temp_malloc(f, sizeof(mults[0]) * c->lookup_values); |
3790 | if (mults == NULL((void*)0)) return error(f, VORBIS_outofmem); |
3791 | for (j=0; j < (int) c->lookup_values; ++j) { |
3792 | int q = get_bits(f, c->value_bits); |
3793 | if (q == EOP(-1)) { setup_temp_free(f,mults,sizeof(mults[0])*c->lookup_values); return error(f, VORBIS_invalid_setup); } |
3794 | mults[j] = q; |
3795 | } |
3796 | |
3797 | #ifndef STB_VORBIS_DIVIDES_IN_CODEBOOK |
3798 | if (c->lookup_type == 1) { |
3799 | int len, sparse = c->sparse; |
3800 | // pre-expand the lookup1-style multiplicands, to avoid a divide in the inner loop |
3801 | if (sparse) { |
3802 | if (c->sorted_entries == 0) goto skip; |
3803 | c->multiplicands = (codetype *) setup_malloc(f, sizeof(c->multiplicands[0]) * c->sorted_entries * c->dimensions); |
3804 | } else |
3805 | c->multiplicands = (codetype *) setup_malloc(f, sizeof(c->multiplicands[0]) * c->entries * c->dimensions); |
3806 | if (c->multiplicands == NULL((void*)0)) { setup_temp_free(f,mults,sizeof(mults[0])*c->lookup_values); return error(f, VORBIS_outofmem); } |
3807 | len = sparse ? c->sorted_entries : c->entries; |
3808 | for (j=0; j < len; ++j) { |
3809 | int z = sparse ? c->sorted_values[j] : j, div=1; |
3810 | for (k=0; k < c->dimensions; ++k) { |
3811 | int off = (z / div) % c->lookup_values; |
3812 | c->multiplicands[j*c->dimensions + k] = |
3813 | #ifndef STB_VORBIS_CODEBOOK_FLOATS |
3814 | mults[off]; |
3815 | #else |
3816 | mults[off]*c->delta_value + c->minimum_value; |
3817 | // in this case (and this case only) we could pre-expand c->sequence_p, |
3818 | // and throw away the decode logic for it; have to ALSO do |
3819 | // it in the case below, but it can only be done if |
3820 | // STB_VORBIS_CODEBOOK_FLOATS |
3821 | // !STB_VORBIS_DIVIDES_IN_CODEBOOK |
3822 | #endif |
3823 | div *= c->lookup_values; |
3824 | } |
3825 | } |
3826 | setup_temp_free(f, mults,sizeof(mults[0])*c->lookup_values); |
3827 | c->lookup_type = 2; |
3828 | } |
3829 | else |
3830 | #endif |
3831 | { |
3832 | c->multiplicands = (codetype *) setup_malloc(f, sizeof(c->multiplicands[0]) * c->lookup_values); |
3833 | #ifndef STB_VORBIS_CODEBOOK_FLOATS |
3834 | memcpy(c->multiplicands, mults, sizeof(c->multiplicands[0]) * c->lookup_values); |
3835 | #else |
3836 | for (j=0; j < (int) c->lookup_values; ++j) |
3837 | c->multiplicands[j] = mults[j] * c->delta_value + c->minimum_value; |
3838 | setup_temp_free(f, mults,sizeof(mults[0])*c->lookup_values); |
3839 | #endif |
3840 | } |
3841 | skip:; |
3842 | |
3843 | #ifdef STB_VORBIS_CODEBOOK_FLOATS |
3844 | if (c->lookup_type == 2 && c->sequence_p) { |
3845 | for (j=1; j < (int) c->lookup_values; ++j) |
3846 | c->multiplicands[j] = c->multiplicands[j-1]; |
3847 | c->sequence_p = 0; |
3848 | } |
3849 | #endif |
3850 | } |
3851 | } |
3852 | |
3853 | // time domain transfers (notused) |
3854 | |
3855 | x = get_bits(f, 6) + 1; |
3856 | for (i=0; i < x; ++i) { |
3857 | uint32 z = get_bits(f, 16); |
3858 | if (z != 0) return error(f, VORBIS_invalid_setup); |
3859 | } |
3860 | |
3861 | // Floors |
3862 | f->floor_count = get_bits(f, 6)+1; |
3863 | f->floor_config = (Floor *) setup_malloc(f, f->floor_count * sizeof(*f->floor_config)); |
3864 | for (i=0; i < f->floor_count; ++i) { |
3865 | f->floor_types[i] = get_bits(f, 16); |
3866 | if (f->floor_types[i] > 1) return error(f, VORBIS_invalid_setup); |
3867 | if (f->floor_types[i] == 0) { |
3868 | Floor0 *g = &f->floor_config[i].floor0; |
3869 | g->order = get_bits(f,8); |
3870 | g->rate = get_bits(f,16); |
3871 | g->bark_map_size = get_bits(f,16); |
3872 | g->amplitude_bits = get_bits(f,6); |
3873 | g->amplitude_offset = get_bits(f,8); |
3874 | g->number_of_books = get_bits(f,4) + 1; |
3875 | for (j=0; j < g->number_of_books; ++j) |
3876 | g->book_list[j] = get_bits(f,8); |
3877 | return error(f, VORBIS_feature_not_supported); |
3878 | } else { |
3879 | Point p[31*8+2]; |
3880 | Floor1 *g = &f->floor_config[i].floor1; |
3881 | int max_class = -1; |
3882 | g->partitions = get_bits(f, 5); |
3883 | for (j=0; j < g->partitions; ++j) { |
3884 | g->partition_class_list[j] = get_bits(f, 4); |
3885 | if (g->partition_class_list[j] > max_class) |
3886 | max_class = g->partition_class_list[j]; |
3887 | } |
3888 | for (j=0; j <= max_class; ++j) { |
3889 | g->class_dimensions[j] = get_bits(f, 3)+1; |
3890 | g->class_subclasses[j] = get_bits(f, 2); |
3891 | if (g->class_subclasses[j]) { |
3892 | g->class_masterbooks[j] = get_bits(f, 8); |
3893 | if (g->class_masterbooks[j] >= f->codebook_count) return error(f, VORBIS_invalid_setup); |
3894 | } |
3895 | for (k=0; k < 1 << g->class_subclasses[j]; ++k) { |
3896 | g->subclass_books[j][k] = get_bits(f,8)-1; |
3897 | if (g->subclass_books[j][k] >= f->codebook_count) return error(f, VORBIS_invalid_setup); |
3898 | } |
3899 | } |
3900 | g->floor1_multiplier = get_bits(f,2)+1; |
3901 | g->rangebits = get_bits(f,4); |
3902 | g->Xlist[0] = 0; |
3903 | g->Xlist[1] = 1 << g->rangebits; |
3904 | g->values = 2; |
3905 | for (j=0; j < g->partitions; ++j) { |
3906 | int c = g->partition_class_list[j]; |
3907 | for (k=0; k < g->class_dimensions[c]; ++k) { |
3908 | g->Xlist[g->values] = get_bits(f, g->rangebits); |
3909 | ++g->values; |
3910 | } |
3911 | } |
3912 | // precompute the sorting |
3913 | for (j=0; j < g->values; ++j) { |
3914 | p[j].x = g->Xlist[j]; |
3915 | p[j].y = j; |
3916 | } |
3917 | qsort(p, g->values, sizeof(p[0]), point_compare); |
3918 | for (j=0; j < g->values; ++j) |
3919 | g->sorted_order[j] = (uint8) p[j].y; |
3920 | // precompute the neighbors |
3921 | for (j=2; j < g->values; ++j) { |
3922 | int low,hi; |
3923 | neighbors(g->Xlist, j, &low,&hi); |
3924 | g->neighbors[j][0] = low; |
3925 | g->neighbors[j][1] = hi; |
3926 | } |
3927 | |
3928 | if (g->values > longest_floorlist) |
3929 | longest_floorlist = g->values; |
3930 | } |
3931 | } |
3932 | |
3933 | // Residue |
3934 | f->residue_count = get_bits(f, 6)+1; |
3935 | f->residue_config = (Residue *) setup_malloc(f, f->residue_count * sizeof(*f->residue_config)); |
3936 | for (i=0; i < f->residue_count; ++i) { |
3937 | uint8 residue_cascade[64]; |
3938 | Residue *r = f->residue_config+i; |
3939 | f->residue_types[i] = get_bits(f, 16); |
3940 | if (f->residue_types[i] > 2) return error(f, VORBIS_invalid_setup); |
3941 | r->begin = get_bits(f, 24); |
3942 | r->end = get_bits(f, 24); |
3943 | r->part_size = get_bits(f,24)+1; |
3944 | r->classifications = get_bits(f,6)+1; |
3945 | r->classbook = get_bits(f,8); |
3946 | for (j=0; j < r->classifications; ++j) { |
3947 | uint8 high_bits=0; |
3948 | uint8 low_bits=get_bits(f,3); |
3949 | if (get_bits(f,1)) |
3950 | high_bits = get_bits(f,5); |
3951 | residue_cascade[j] = high_bits*8 + low_bits; |
3952 | } |
3953 | r->residue_books = (short (*)[8]) setup_malloc(f, sizeof(r->residue_books[0]) * r->classifications); |
3954 | for (j=0; j < r->classifications; ++j) { |
3955 | for (k=0; k < 8; ++k) { |
3956 | if (residue_cascade[j] & (1 << k)) { |
3957 | r->residue_books[j][k] = get_bits(f, 8); |
3958 | if (r->residue_books[j][k] >= f->codebook_count) return error(f, VORBIS_invalid_setup); |
3959 | } else { |
3960 | r->residue_books[j][k] = -1; |
3961 | } |
3962 | } |
3963 | } |
3964 | // precompute the classifications[] array to avoid inner-loop mod/divide |
3965 | // call it 'classdata' since we already have r->classifications |
3966 | r->classdata = (uint8 **) setup_malloc(f, sizeof(*r->classdata) * f->codebooks[r->classbook].entries); |
3967 | if (!r->classdata) return error(f, VORBIS_outofmem); |
3968 | memset(r->classdata, 0, sizeof(*r->classdata) * f->codebooks[r->classbook].entries); |
3969 | for (j=0; j < f->codebooks[r->classbook].entries; ++j) { |
3970 | int classwords = f->codebooks[r->classbook].dimensions; |
3971 | int temp = j; |
3972 | r->classdata[j] = (uint8 *) setup_malloc(f, sizeof(r->classdata[j][0]) * classwords); |
3973 | for (k=classwords-1; k >= 0; --k) { |
3974 | r->classdata[j][k] = temp % r->classifications; |
3975 | temp /= r->classifications; |
3976 | } |
3977 | } |
3978 | } |
3979 | |
3980 | f->mapping_count = get_bits(f,6)+1; |
3981 | f->mapping = (Mapping *) setup_malloc(f, f->mapping_count * sizeof(*f->mapping)); |
3982 | for (i=0; i < f->mapping_count; ++i) { |
3983 | Mapping *m = f->mapping + i; |
3984 | int mapping_type = get_bits(f,16); |
3985 | if (mapping_type != 0) return error(f, VORBIS_invalid_setup); |
3986 | m->chan = (MappingChannel *) setup_malloc(f, f->channels * sizeof(*m->chan)); |
3987 | if (get_bits(f,1)) |
3988 | m->submaps = get_bits(f,4); |
3989 | else |
3990 | m->submaps = 1; |
3991 | if (m->submaps > max_submaps) |
3992 | max_submaps = m->submaps; |
3993 | if (get_bits(f,1)) { |
3994 | m->coupling_steps = get_bits(f,8)+1; |
3995 | for (k=0; k < m->coupling_steps; ++k) { |
3996 | m->chan[k].magnitude = get_bits(f, ilog(f->channels)-1); |
3997 | m->chan[k].angle = get_bits(f, ilog(f->channels)-1); |
3998 | if (m->chan[k].magnitude >= f->channels) return error(f, VORBIS_invalid_setup); |
3999 | if (m->chan[k].angle >= f->channels) return error(f, VORBIS_invalid_setup); |
4000 | if (m->chan[k].magnitude == m->chan[k].angle) return error(f, VORBIS_invalid_setup); |
4001 | } |
4002 | } else |
4003 | m->coupling_steps = 0; |
4004 | |
4005 | // reserved field |
4006 | if (get_bits(f,2)) return error(f, VORBIS_invalid_setup); |
4007 | if (m->submaps > 1) { |
4008 | for (j=0; j < f->channels; ++j) { |
4009 | m->chan[j].mux = get_bits(f, 4); |
4010 | if (m->chan[j].mux >= m->submaps) return error(f, VORBIS_invalid_setup); |
4011 | } |
4012 | } else |
4013 | // @SPECIFICATION: this case is missing from the spec |
4014 | for (j=0; j < f->channels; ++j) |
4015 | m->chan[j].mux = 0; |
4016 | |
4017 | for (j=0; j < m->submaps; ++j) { |
4018 | get_bits(f,8); // discard |
4019 | m->submap_floor[j] = get_bits(f,8); |
4020 | m->submap_residue[j] = get_bits(f,8); |
4021 | if (m->submap_floor[j] >= f->floor_count) return error(f, VORBIS_invalid_setup); |
4022 | if (m->submap_residue[j] >= f->residue_count) return error(f, VORBIS_invalid_setup); |
4023 | } |
4024 | } |
4025 | |
4026 | // Modes |
4027 | f->mode_count = get_bits(f, 6)+1; |
4028 | for (i=0; i < f->mode_count; ++i) { |
4029 | Mode *m = f->mode_config+i; |
4030 | m->blockflag = get_bits(f,1); |
4031 | m->windowtype = get_bits(f,16); |
4032 | m->transformtype = get_bits(f,16); |
4033 | m->mapping = get_bits(f,8); |
4034 | if (m->windowtype != 0) return error(f, VORBIS_invalid_setup); |
4035 | if (m->transformtype != 0) return error(f, VORBIS_invalid_setup); |
4036 | if (m->mapping >= f->mapping_count) return error(f, VORBIS_invalid_setup); |
4037 | } |
4038 | |
4039 | flush_packet(f); |
4040 | |
4041 | f->previous_length = 0; |
4042 | |
4043 | for (i=0; i < f->channels; ++i) { |
4044 | f->channel_buffers[i] = (float *) setup_malloc(f, sizeof(float) * f->blocksize_1); |
4045 | f->previous_window[i] = (float *) setup_malloc(f, sizeof(float) * f->blocksize_1/2); |
4046 | f->finalY[i] = (int16 *) setup_malloc(f, sizeof(int16) * longest_floorlist); |
4047 | #ifdef STB_VORBIS_NO_DEFER_FLOOR |
4048 | f->floor_buffers[i] = (float *) setup_malloc(f, sizeof(float) * f->blocksize_1/2); |
4049 | #endif |
4050 | } |
4051 | |
4052 | if (!init_blocksize(f, 0, f->blocksize_0)) return FALSE0; |
4053 | if (!init_blocksize(f, 1, f->blocksize_1)) return FALSE0; |
4054 | f->blocksize[0] = f->blocksize_0; |
4055 | f->blocksize[1] = f->blocksize_1; |
4056 | |
4057 | #ifdef STB_VORBIS_DIVIDE_TABLE |
4058 | if (integer_divide_table[1][1]==0) |
4059 | for (i=0; i < DIVTAB_NUMER; ++i) |
4060 | for (j=1; j < DIVTAB_DENOM; ++j) |
4061 | integer_divide_table[i][j] = i / j; |
4062 | #endif |
4063 | |
4064 | // compute how much temporary memory is needed |
4065 | |
4066 | // 1. |
4067 | { |
4068 | uint32 imdct_mem = (f->blocksize_1 * sizeof(float) >> 1); |
4069 | uint32 classify_mem; |
4070 | int i,max_part_read=0; |
4071 | for (i=0; i < f->residue_count; ++i) { |
4072 | Residue *r = f->residue_config + i; |
4073 | int n_read = r->end - r->begin; |
4074 | int part_read = n_read / r->part_size; |
4075 | if (part_read > max_part_read) |
4076 | max_part_read = part_read; |
4077 | } |
4078 | #ifndef STB_VORBIS_DIVIDES_IN_RESIDUE |
4079 | classify_mem = f->channels * (sizeof(void*) + max_part_read * sizeof(uint8 *)); |
4080 | #else |
4081 | classify_mem = f->channels * (sizeof(void*) + max_part_read * sizeof(int *)); |
4082 | #endif |
4083 | |
4084 | f->temp_memory_required = classify_mem; |
4085 | if (imdct_mem > f->temp_memory_required) |
4086 | f->temp_memory_required = imdct_mem; |
4087 | } |
4088 | |
4089 | f->first_decode = TRUE1; |
4090 | |
4091 | if (f->alloc.alloc_buffer) { |
4092 | assert(f->temp_offset == f->alloc.alloc_buffer_length_in_bytes)((f->temp_offset == f->alloc.alloc_buffer_length_in_bytes ) ? (void)0 : _assert("f->temp_offset == f->alloc.alloc_buffer_length_in_bytes" , "src/siege/internal/stb/stb_vorbis.c", 4092)); |
4093 | // check if there's enough temp memory so we don't error later |
4094 | if (f->setup_offset + sizeof(*f) + f->temp_memory_required > (unsigned) f->temp_offset) |
4095 | return error(f, VORBIS_outofmem); |
4096 | } |
4097 | |
4098 | f->first_audio_page_offset = stb_vorbis_get_file_offset(f); |
4099 | |
4100 | return TRUE1; |
4101 | } |
4102 | |
4103 | static void vorbis_deinit(stb_vorbis *p) |
4104 | { |
4105 | int i,j; |
4106 | for (i=0; i < p->residue_count; ++i) { |
4107 | Residue *r = p->residue_config+i; |
4108 | if (r->classdata) { |
4109 | for (j=0; j < p->codebooks[r->classbook].entries; ++j) |
4110 | setup_free(p, r->classdata[j]); |
4111 | setup_free(p, r->classdata); |
4112 | } |
4113 | setup_free(p, r->residue_books); |
4114 | } |
4115 | |
4116 | if (p->codebooks) { |
4117 | for (i=0; i < p->codebook_count; ++i) { |
4118 | Codebook *c = p->codebooks + i; |
4119 | setup_free(p, c->codeword_lengths); |
4120 | setup_free(p, c->multiplicands); |
4121 | setup_free(p, c->codewords); |
4122 | setup_free(p, c->sorted_codewords); |
4123 | // c->sorted_values[-1] is the first entry in the array |
4124 | setup_free(p, c->sorted_values ? c->sorted_values-1 : NULL((void*)0)); |
4125 | } |
4126 | setup_free(p, p->codebooks); |
4127 | } |
4128 | setup_free(p, p->floor_config); |
4129 | setup_free(p, p->residue_config); |
4130 | for (i=0; i < p->mapping_count; ++i) |
4131 | setup_free(p, p->mapping[i].chan); |
4132 | setup_free(p, p->mapping); |
4133 | for (i=0; i < p->channels; ++i) { |
4134 | setup_free(p, p->channel_buffers[i]); |
4135 | setup_free(p, p->previous_window[i]); |
4136 | #ifdef STB_VORBIS_NO_DEFER_FLOOR |
4137 | setup_free(p, p->floor_buffers[i]); |
4138 | #endif |
4139 | setup_free(p, p->finalY[i]); |
4140 | } |
4141 | for (i=0; i < 2; ++i) { |
4142 | setup_free(p, p->A[i]); |
4143 | setup_free(p, p->B[i]); |
4144 | setup_free(p, p->C(2 | 4 | 1)[i]); |
4145 | setup_free(p, p->window[i]); |
4146 | } |
4147 | #ifndef STB_VORBIS_NO_STDIO |
4148 | if (p->close_on_free) fclose(p->f); |
4149 | #endif |
4150 | } |
4151 | |
4152 | void stb_vorbis_close(stb_vorbis *p) |
4153 | { |
4154 | if (p == NULL((void*)0)) return; |
4155 | vorbis_deinit(p); |
4156 | setup_free(p,p); |
4157 | } |
4158 | |
4159 | static void vorbis_init(stb_vorbis *p, stb_vorbis_alloc *z) |
4160 | { |
4161 | memset(p, 0, sizeof(*p)); // NULL out all malloc'd pointers to start |
4162 | if (z) { |
4163 | p->alloc = *z; |
4164 | p->alloc.alloc_buffer_length_in_bytes = (p->alloc.alloc_buffer_length_in_bytes+3) & ~3; |
4165 | p->temp_offset = p->alloc.alloc_buffer_length_in_bytes; |
4166 | } |
4167 | p->eof = 0; |
4168 | p->error = VORBIS__no_error; |
4169 | p->stream = NULL((void*)0); |
4170 | p->codebooks = NULL((void*)0); |
4171 | p->page_crc_tests = -1; |
4172 | #ifndef STB_VORBIS_NO_STDIO |
4173 | p->close_on_free = FALSE0; |
4174 | p->f = NULL((void*)0); |
4175 | #endif |
4176 | } |
4177 | |
4178 | int stb_vorbis_get_sample_offset(stb_vorbis *f) |
4179 | { |
4180 | if (f->current_loc_valid) |
4181 | return f->current_loc; |
4182 | else |
4183 | return -1; |
4184 | } |
4185 | |
4186 | stb_vorbis_info stb_vorbis_get_info(stb_vorbis *f) |
4187 | { |
4188 | stb_vorbis_info d; |
4189 | d.channels = f->channels; |
4190 | d.sample_rate = f->sample_rate; |
4191 | d.setup_memory_required = f->setup_memory_required; |
4192 | d.setup_temp_memory_required = f->setup_temp_memory_required; |
4193 | d.temp_memory_required = f->temp_memory_required; |
4194 | d.max_frame_size = f->blocksize_1 >> 1; |
4195 | return d; |
4196 | } |
4197 | |
4198 | int stb_vorbis_get_error(stb_vorbis *f) |
4199 | { |
4200 | int e = f->error; |
4201 | f->error = VORBIS__no_error; |
4202 | return e; |
4203 | } |
4204 | |
4205 | static stb_vorbis * vorbis_alloc(stb_vorbis *f) |
4206 | { |
4207 | stb_vorbis *p = (stb_vorbis *) setup_malloc(f, sizeof(*p)); |
4208 | return p; |
4209 | } |
4210 | |
4211 | #ifndef STB_VORBIS_NO_PUSHDATA_API |
4212 | |
4213 | void stb_vorbis_flush_pushdata(stb_vorbis *f) |
4214 | { |
4215 | f->previous_length = 0; |
4216 | f->page_crc_tests = 0; |
4217 | f->discard_samples_deferred = 0; |
4218 | f->current_loc_valid = FALSE0; |
4219 | f->first_decode = FALSE0; |
4220 | f->samples_output = 0; |
4221 | f->channel_buffer_start = 0; |
4222 | f->channel_buffer_end = 0; |
4223 | } |
4224 | |
4225 | static int vorbis_search_for_page_pushdata(vorb *f, uint8 *data, int data_len) |
4226 | { |
4227 | int i,n; |
4228 | for (i=0; i < f->page_crc_tests; ++i) |
4229 | f->scan[i].bytes_done = 0; |
4230 | |
4231 | // if we have room for more scans, search for them first, because |
4232 | // they may cause us to stop early if their header is incomplete |
4233 | if (f->page_crc_tests < STB_VORBIS_PUSHDATA_CRC_COUNT4) { |
4234 | if (data_len < 4) return 0; |
4235 | data_len -= 3; // need to look for 4-byte sequence, so don't miss |
4236 | // one that straddles a boundary |
4237 | for (i=0; i < data_len; ++i) { |
4238 | if (data[i] == 0x4f) { |
4239 | if (0==memcmp(data+i, ogg_page_header, 4)) { |
4240 | int j,len; |
4241 | uint32 crc; |
4242 | // make sure we have the whole page header |
4243 | if (i+26 >= data_len || i+27+data[i+26] >= data_len) { |
4244 | // only read up to this page start, so hopefully we'll |
4245 | // have the whole page header start next time |
4246 | data_len = i; |
4247 | break; |
4248 | } |
4249 | // ok, we have it all; compute the length of the page |
4250 | len = 27 + data[i+26]; |
4251 | for (j=0; j < data[i+26]; ++j) |
4252 | len += data[i+27+j]; |
4253 | // scan everything up to the embedded crc (which we must 0) |
4254 | crc = 0; |
4255 | for (j=0; j < 22; ++j) |
4256 | crc = crc32_update(crc, data[i+j]); |
4257 | // now process 4 0-bytes |
4258 | for ( ; j < 26; ++j) |
4259 | crc = crc32_update(crc, 0); |
4260 | // len is the total number of bytes we need to scan |
4261 | n = f->page_crc_tests++; |
4262 | f->scan[n].bytes_left = len-j; |
4263 | f->scan[n].crc_so_far = crc; |
4264 | f->scan[n].goal_crc = data[i+22] + (data[i+23] << 8) + (data[i+24]<<16) + (data[i+25]<<24); |
4265 | // if the last frame on a page is continued to the next, then |
4266 | // we can't recover the sample_loc immediately |
4267 | if (data[i+27+data[i+26]-1] == 255) |
4268 | f->scan[n].sample_loc = ~0; |
4269 | else |
4270 | f->scan[n].sample_loc = data[i+6] + (data[i+7] << 8) + (data[i+ 8]<<16) + (data[i+ 9]<<24); |
4271 | f->scan[n].bytes_done = i+j; |
4272 | if (f->page_crc_tests == STB_VORBIS_PUSHDATA_CRC_COUNT4) |
4273 | break; |
4274 | // keep going if we still have room for more |
4275 | } |
4276 | } |
4277 | } |
4278 | } |
4279 | |
4280 | for (i=0; i < f->page_crc_tests;) { |
4281 | uint32 crc; |
4282 | int j; |
4283 | int n = f->scan[i].bytes_done; |
4284 | int m = f->scan[i].bytes_left; |
4285 | if (m > data_len - n) m = data_len - n; |
4286 | // m is the bytes to scan in the current chunk |
4287 | crc = f->scan[i].crc_so_far; |
4288 | for (j=0; j < m; ++j) |
4289 | crc = crc32_update(crc, data[n+j]); |
4290 | f->scan[i].bytes_left -= m; |
4291 | f->scan[i].crc_so_far = crc; |
4292 | if (f->scan[i].bytes_left == 0) { |
4293 | // does it match? |
4294 | if (f->scan[i].crc_so_far == f->scan[i].goal_crc) { |
4295 | // Houston, we have page |
4296 | data_len = n+m; // consumption amount is wherever that scan ended |
4297 | f->page_crc_tests = -1; // drop out of page scan mode |
4298 | f->previous_length = 0; // decode-but-don't-output one frame |
4299 | f->next_seg = -1; // start a new page |
4300 | f->current_loc = f->scan[i].sample_loc; // set the current sample location |
4301 | // to the amount we'd have decoded had we decoded this page |
4302 | f->current_loc_valid = f->current_loc != ~0; |
4303 | return data_len; |
4304 | } |
4305 | // delete entry |
4306 | f->scan[i] = f->scan[--f->page_crc_tests]; |
4307 | } else { |
4308 | ++i; |
4309 | } |
4310 | } |
4311 | |
4312 | return data_len; |
4313 | } |
4314 | |
4315 | // return value: number of bytes we used |
4316 | int stb_vorbis_decode_frame_pushdata( |
4317 | stb_vorbis *f, // the file we're decoding |
4318 | uint8 *data, int data_len, // the memory available for decoding |
4319 | int *channels, // place to write number of float * buffers |
4320 | float ***output, // place to write float ** array of float * buffers |
4321 | int *samples // place to write number of output samples |
4322 | ) |
4323 | { |
4324 | int i; |
4325 | int len,right,left; |
4326 | |
4327 | if (!IS_PUSH_MODE(f)((f)->push_mode)) return error(f, VORBIS_invalid_api_mixing); |
4328 | |
4329 | if (f->page_crc_tests >= 0) { |
4330 | *samples = 0; |
4331 | return vorbis_search_for_page_pushdata(f, data, data_len); |
4332 | } |
4333 | |
4334 | f->stream = data; |
4335 | f->stream_end = data + data_len; |
4336 | f->error = VORBIS__no_error; |
4337 | |
4338 | // check that we have the entire packet in memory |
4339 | if (!is_whole_packet_present(f, FALSE0)) { |
4340 | *samples = 0; |
4341 | return 0; |
4342 | } |
4343 | |
4344 | if (!vorbis_decode_packet(f, &len, &left, &right)) { |
4345 | // save the actual error we encountered |
4346 | enum STBVorbisError error = f->error; |
4347 | if (error == VORBIS_bad_packet_type) { |
4348 | // flush and resynch |
4349 | f->error = VORBIS__no_error; |
4350 | while (get8_packet(f) != EOP(-1)) |
4351 | if (f->eof) break; |
4352 | *samples = 0; |
4353 | return f->stream - data; |
4354 | } |
4355 | if (error == VORBIS_continued_packet_flag_invalid) { |
4356 | if (f->previous_length == 0) { |
4357 | // we may be resynching, in which case it's ok to hit one |
4358 | // of these; just discard the packet |
4359 | f->error = VORBIS__no_error; |
4360 | while (get8_packet(f) != EOP(-1)) |
4361 | if (f->eof) break; |
4362 | *samples = 0; |
4363 | return f->stream - data; |
4364 | } |
4365 | } |
4366 | // if we get an error while parsing, what to do? |
4367 | // well, it DEFINITELY won't work to continue from where we are! |
4368 | stb_vorbis_flush_pushdata(f); |
4369 | // restore the error that actually made us bail |
4370 | f->error = error; |
4371 | *samples = 0; |
4372 | return 1; |
4373 | } |
4374 | |
4375 | // success! |
4376 | len = vorbis_finish_frame(f, len, left, right); |
4377 | for (i=0; i < f->channels; ++i) |
4378 | f->outputs[i] = f->channel_buffers[i] + left; |
4379 | |
4380 | if (channels) *channels = f->channels; |
4381 | *samples = len; |
4382 | *output = f->outputs; |
4383 | return f->stream - data; |
4384 | } |
4385 | |
4386 | stb_vorbis *stb_vorbis_open_pushdata( |
4387 | unsigned char *data, int data_len, // the memory available for decoding |
4388 | int *data_used, // only defined if result is not NULL |
4389 | int *error, stb_vorbis_alloc *alloc) |
4390 | { |
4391 | stb_vorbis *f, p; |
4392 | vorbis_init(&p, alloc); |
4393 | p.stream = data; |
4394 | p.stream_end = data + data_len; |
4395 | p.push_mode = TRUE1; |
4396 | if (!start_decoder(&p)) { |
4397 | if (p.eof) |
4398 | *error = VORBIS_need_more_data; |
4399 | else |
4400 | *error = p.error; |
4401 | return NULL((void*)0); |
4402 | } |
4403 | f = vorbis_alloc(&p); |
4404 | if (f) { |
4405 | *f = p; |
4406 | *data_used = f->stream - data; |
4407 | *error = 0; |
4408 | return f; |
4409 | } else { |
4410 | vorbis_deinit(&p); |
4411 | return NULL((void*)0); |
4412 | } |
4413 | } |
4414 | #endif // STB_VORBIS_NO_PUSHDATA_API |
4415 | |
4416 | unsigned int stb_vorbis_get_file_offset(stb_vorbis *f) |
4417 | { |
4418 | #ifndef STB_VORBIS_NO_PUSHDATA_API |
4419 | if (f->push_mode) return 0; |
4420 | #endif |
4421 | if (USE_MEMORY(f)((f)->stream)) return f->stream - f->stream_start; |
4422 | #ifndef STB_VORBIS_NO_STDIO |
4423 | return ftell(f->f) - f->f_start; |
4424 | #endif |
4425 | } |
4426 | |
4427 | #ifndef STB_VORBIS_NO_PULLDATA_API |
4428 | // |
4429 | // DATA-PULLING API |
4430 | // |
4431 | |
4432 | static uint32 vorbis_find_page(stb_vorbis *f, uint32 *end, uint32 *last) |
4433 | { |
4434 | for(;;) { |
4435 | int n; |
4436 | if (f->eof) return 0; |
4437 | n = get8(f); |
4438 | if (n == 0x4f) { // page header |
4439 | unsigned int retry_loc = stb_vorbis_get_file_offset(f); |
4440 | int i; |
4441 | // check if we're off the end of a file_section stream |
4442 | if (retry_loc - 25 > f->stream_len) |
4443 | return 0; |
4444 | // check the rest of the header |
4445 | for (i=1; i < 4; ++i) |
4446 | if (get8(f) != ogg_page_header[i]) |
4447 | break; |
4448 | if (f->eof) return 0; |
4449 | if (i == 4) { |
4450 | uint8 header[27]; |
4451 | uint32 i, crc, goal, len; |
4452 | for (i=0; i < 4; ++i) |
4453 | header[i] = ogg_page_header[i]; |
4454 | for (; i < 27; ++i) |
4455 | header[i] = get8(f); |
4456 | if (f->eof) return 0; |
4457 | if (header[4] != 0) goto invalid; |
4458 | goal = header[22] + (header[23] << 8) + (header[24]<<16) + (header[25]<<24); |
4459 | for (i=22; i < 26; ++i) |
4460 | header[i] = 0; |
4461 | crc = 0; |
4462 | for (i=0; i < 27; ++i) |
4463 | crc = crc32_update(crc, header[i]); |
4464 | len = 0; |
4465 | for (i=0; i < header[26]; ++i) { |
4466 | int s = get8(f); |
4467 | crc = crc32_update(crc, s); |
4468 | len += s; |
4469 | } |
4470 | if (len && f->eof) return 0; |
4471 | for (i=0; i < len; ++i) |
4472 | crc = crc32_update(crc, get8(f)); |
4473 | // finished parsing probable page |
4474 | if (crc == goal) { |
4475 | // we could now check that it's either got the last |
4476 | // page flag set, OR it's followed by the capture |
4477 | // pattern, but I guess TECHNICALLY you could have |
4478 | // a file with garbage between each ogg page and recover |
4479 | // from it automatically? So even though that paranoia |
4480 | // might decrease the chance of an invalid decode by |
4481 | // another 2^32, not worth it since it would hose those |
4482 | // invalid-but-useful files? |
4483 | if (end) |
4484 | *end = stb_vorbis_get_file_offset(f); |
4485 | if (last) |
4486 | { |
4487 | if (header[5] & 0x04) |
4488 | *last = 1; |
4489 | else |
4490 | *last = 0; |
4491 | } |
4492 | set_file_offset(f, retry_loc-1); |
4493 | return 1; |
4494 | } |
4495 | } |
4496 | invalid: |
4497 | // not a valid page, so rewind and look for next one |
4498 | set_file_offset(f, retry_loc); |
4499 | } |
4500 | } |
4501 | } |
4502 | |
4503 | // seek is implemented with 'interpolation search'--this is like |
4504 | // binary search, but we use the data values to estimate the likely |
4505 | // location of the data item (plus a bit of a bias so when the |
4506 | // estimation is wrong we don't waste overly much time) |
4507 | |
4508 | #define SAMPLE_unknown0xffffffff 0xffffffff |
4509 | |
4510 | |
4511 | // ogg vorbis, in its insane infinite wisdom, only provides |
4512 | // information about the sample at the END of the page. |
4513 | // therefore we COULD have the data we need in the current |
4514 | // page, and not know it. we could just use the end location |
4515 | // as our only knowledge for bounds, seek back, and eventually |
4516 | // the binary search finds it. or we can try to be smart and |
4517 | // not waste time trying to locate more pages. we try to be |
4518 | // smart, since this data is already in memory anyway, so |
4519 | // doing needless I/O would be crazy! |
4520 | static int vorbis_analyze_page(stb_vorbis *f, ProbedPage *z) |
4521 | { |
4522 | uint8 header[27], lacing[255]; |
4523 | uint8 packet_type[255]; |
4524 | int num_packet, packet_start, previous =0; |
4525 | (void)previous; |
4526 | int i,len; |
4527 | uint32 samples; |
4528 | |
4529 | // record where the page starts |
4530 | z->page_start = stb_vorbis_get_file_offset(f); |
4531 | |
4532 | // parse the header |
4533 | getn(f, header, 27); |
4534 | assert(header[0] == 'O' && header[1] == 'g' && header[2] == 'g' && header[3] == 'S')((header[0] == 'O' && header[1] == 'g' && header [2] == 'g' && header[3] == 'S') ? (void)0 : _assert("header[0] == 'O' && header[1] == 'g' && header[2] == 'g' && header[3] == 'S'" , "src/siege/internal/stb/stb_vorbis.c", 4534)); |
4535 | getn(f, lacing, header[26]); |
4536 | |
4537 | // determine the length of the payload |
4538 | len = 0; |
4539 | for (i=0; i < header[26]; ++i) |
4540 | len += lacing[i]; |
4541 | |
4542 | // this implies where the page ends |
4543 | z->page_end = z->page_start + 27 + header[26] + len; |
4544 | |
4545 | // read the last-decoded sample out of the data |
4546 | z->last_decoded_sample = header[6] + (header[7] << 8) + (header[8] << 16) + (header[9] << 16); |
4547 | |
4548 | if (header[5] & 4) { |
4549 | // if this is the last page, it's not possible to work |
4550 | // backwards to figure out the first sample! whoops! fuck. |
4551 | z->first_decoded_sample = SAMPLE_unknown0xffffffff; |
4552 | set_file_offset(f, z->page_start); |
4553 | return 1; |
4554 | } |
4555 | |
4556 | // scan through the frames to determine the sample-count of each one... |
4557 | // our goal is the sample # of the first fully-decoded sample on the |
4558 | // page, which is the first decoded sample of the 2nd page |
4559 | |
4560 | num_packet=0; |
4561 | |
4562 | packet_start = ((header[5] & 1) == 0); |
4563 | |
4564 | for (i=0; i < header[26]; ++i) { |
4565 | if (packet_start) { |
4566 | uint8 n,b,m; |
4567 | if (lacing[i] == 0) goto bail; // trying to read from zero-length packet |
4568 | n = get8(f); |
4569 | // if bottom bit is non-zero, we've got corruption |
4570 | if (n & 1) goto bail; |
4571 | n >>= 1; |
4572 | b = ilog(f->mode_count-1); |
4573 | m = n >> b; |
4574 | n &= (1 << b)-1; |
4575 | if (n >= f->mode_count) goto bail; |
4576 | if (num_packet == 0 && f->mode_config[n].blockflag) |
4577 | previous = (m & 1); |
4578 | packet_type[num_packet++] = f->mode_config[n].blockflag; |
4579 | skip(f, lacing[i]-1); |
4580 | } else |
4581 | skip(f, lacing[i]); |
4582 | packet_start = (lacing[i] < 255); |
4583 | } |
4584 | |
4585 | // now that we know the sizes of all the pages, we can start determining |
4586 | // how much sample data there is. |
4587 | |
4588 | samples = 0; |
4589 | |
4590 | // for the last packet, we step by its whole length, because the definition |
4591 | // is that we encoded the end sample loc of the 'last packet completed', |
4592 | // where 'completed' refers to packets being split, and we are left to guess |
4593 | // what 'end sample loc' means. we assume it means ignoring the fact that |
4594 | // the last half of the data is useless without windowing against the next |
4595 | // packet... (so it's not REALLY complete in that sense) |
4596 | if (num_packet > 1) |
4597 | samples += f->blocksize[packet_type[num_packet-1]]; |
4598 | |
4599 | for (i=num_packet-2; i >= 1; --i) { |
4600 | // now, for this packet, how many samples do we have that |
4601 | // do not overlap the following packet? |
4602 | if (packet_type[i] == 1) |
4603 | if (packet_type[i+1] == 1) |
4604 | samples += f->blocksize_1 >> 1; |
4605 | else |
4606 | samples += ((f->blocksize_1 - f->blocksize_0) >> 2) + (f->blocksize_0 >> 1); |
4607 | else |
4608 | samples += f->blocksize_0 >> 1; |
4609 | } |
4610 | // now, at this point, we've rewound to the very beginning of the |
4611 | // _second_ packet. if we entirely discard the first packet after |
4612 | // a seek, this will be exactly the right sample number. HOWEVER! |
4613 | // we can't as easily compute this number for the LAST page. The |
4614 | // only way to get the sample offset of the LAST page is to use |
4615 | // the end loc from the previous page. But what that returns us |
4616 | // is _exactly_ the place where we get our first non-overlapped |
4617 | // sample. (I think. Stupid spec for being ambiguous.) So for |
4618 | // consistency it's better to do that here, too. However, that |
4619 | // will then require us to NOT discard all of the first frame we |
4620 | // decode, in some cases, which means an even weirder frame size |
4621 | // and extra code. what a fucking pain. |
4622 | |
4623 | // we're going to discard the first packet if we |
4624 | // start the seek here, so we don't care about it. (we could actually |
4625 | // do better; if the first packet is long, and the previous packet |
4626 | // is short, there's actually data in the first half of the first |
4627 | // packet that doesn't need discarding... but not worth paying the |
4628 | // effort of tracking that of that here and in the seeking logic) |
4629 | // except crap, if we infer it from the _previous_ packet's end |
4630 | // location, we DO need to use that definition... and we HAVE to |
4631 | // infer the start loc of the LAST packet from the previous packet's |
4632 | // end location. fuck you, ogg vorbis. |
4633 | |
4634 | z->first_decoded_sample = z->last_decoded_sample - samples; |
4635 | |
4636 | // restore file state to where we were |
4637 | set_file_offset(f, z->page_start); |
4638 | return 1; |
4639 | |
4640 | // restore file state to where we were |
4641 | bail: |
4642 | set_file_offset(f, z->page_start); |
4643 | return 0; |
4644 | } |
4645 | |
4646 | static int vorbis_seek_frame_from_page(stb_vorbis *f, uint32 page_start, uint32 first_sample, uint32 target_sample, int fine) |
4647 | { |
4648 | int left_start, left_end, right_start, right_end, mode,i; |
4649 | int frame=0; |
4650 | uint32 frame_start; |
4651 | int frames_to_skip, data_to_skip; |
4652 | |
4653 | // first_sample is the sample # of the first sample that doesn't |
4654 | // overlap the previous page... note that this requires us to |
4655 | // _partially_ discard the first packet! bleh. |
4656 | set_file_offset(f, page_start); |
4657 | |
4658 | f->next_seg = -1; // force page resync |
4659 | |
4660 | frame_start = first_sample; |
4661 | // frame start is where the previous packet's last decoded sample |
4662 | // was, which corresponds to left_end... EXCEPT if the previous |
4663 | // packet was long and this packet is short? Probably a bug here. |
4664 | |
4665 | |
4666 | // now, we can start decoding frames... we'll only FAKE decode them, |
4667 | // until we find the frame that contains our sample; then we'll rewind, |
4668 | // and try again |
4669 | for (;;) { |
4670 | int start; |
4671 | |
4672 | if (!vorbis_decode_initial(f, &left_start, &left_end, &right_start, &right_end, &mode)) |
4673 | return error(f, VORBIS_seek_failed); |
4674 | |
4675 | if (frame == 0) |
4676 | start = left_end; |
4677 | else |
4678 | start = left_start; |
4679 | |
4680 | // the window starts at left_start; the last valid sample we generate |
4681 | // before the next frame's window start is right_start-1 |
4682 | if (target_sample < frame_start + right_start-start) |
4683 | break; |
4684 | |
4685 | flush_packet(f); |
4686 | if (f->eof) |
4687 | return error(f, VORBIS_seek_failed); |
4688 | |
4689 | frame_start += right_start - start; |
4690 | |
4691 | ++frame; |
4692 | } |
4693 | |
4694 | // ok, at this point, the sample we want is contained in frame #'frame' |
4695 | |
4696 | // to decode frame #'frame' normally, we have to decode the |
4697 | // previous frame first... but if it's the FIRST frame of the page |
4698 | // we can't. if it's the first frame, it means it falls in the part |
4699 | // of the first frame that doesn't overlap either of the other frames. |
4700 | // so, if we have to handle that case for the first frame, we might |
4701 | // as well handle it for all of them, so: |
4702 | if (target_sample > frame_start + (left_end - left_start)) { |
4703 | // so what we want to do is go ahead and just immediately decode |
4704 | // this frame, but then make it so the next get_frame_float() uses |
4705 | // this already-decoded data? or do we want to go ahead and rewind, |
4706 | // and leave a flag saying to skip the first N data? let's do that |
4707 | frames_to_skip = frame; // if this is frame #1, skip 1 frame (#0) |
4708 | data_to_skip = left_end - left_start; |
4709 | } else { |
4710 | // otherwise, we want to skip frames 0, 1, 2, ... frame-2 |
4711 | // (which means frame-2+1 total frames) then decode frame-1, |
4712 | // then leave frame pending |
4713 | frames_to_skip = frame - 1; |
4714 | assert(frames_to_skip >= 0)((frames_to_skip >= 0) ? (void)0 : _assert("frames_to_skip >= 0" , "src/siege/internal/stb/stb_vorbis.c", 4714)); |
4715 | data_to_skip = -1; |
4716 | } |
4717 | |
4718 | set_file_offset(f, page_start); |
4719 | f->next_seg = - 1; // force page resync |
4720 | |
4721 | for (i=0; i < frames_to_skip; ++i) { |
4722 | maybe_start_packet(f); |
4723 | flush_packet(f); |
4724 | } |
4725 | |
4726 | if (data_to_skip >= 0) { |
4727 | int i,j,n = f->blocksize_0 >> 1; |
4728 | f->discard_samples_deferred = data_to_skip; |
4729 | for (i=0; i < f->channels; ++i) |
4730 | for (j=0; j < n; ++j) |
4731 | f->previous_window[i][j] = 0; |
4732 | f->previous_length = n; |
4733 | frame_start += data_to_skip; |
4734 | } else { |
4735 | f->previous_length = 0; |
4736 | vorbis_pump_first_frame(f); |
4737 | } |
4738 | |
4739 | // at this point, the NEXT decoded frame will generate the desired sample |
4740 | if (fine) { |
4741 | // so if we're doing sample accurate streaming, we want to go ahead and decode it! |
4742 | if (target_sample != frame_start) { |
4743 | int n; |
4744 | stb_vorbis_get_frame_float(f, &n, NULL((void*)0)); |
4745 | assert(target_sample > frame_start)((target_sample > frame_start) ? (void)0 : _assert("target_sample > frame_start" , "src/siege/internal/stb/stb_vorbis.c", 4745)); |
4746 | assert(f->channel_buffer_start + (int) (target_sample-frame_start) < f->channel_buffer_end)((f->channel_buffer_start + (int) (target_sample-frame_start ) < f->channel_buffer_end) ? (void)0 : _assert("f->channel_buffer_start + (int) (target_sample-frame_start) < f->channel_buffer_end" , "src/siege/internal/stb/stb_vorbis.c", 4746)); |
4747 | f->channel_buffer_start += (target_sample - frame_start); |
4748 | } |
4749 | } |
4750 | |
4751 | return 0; |
4752 | } |
4753 | |
4754 | static int vorbis_seek_base(stb_vorbis *f, unsigned int sample_number, int fine) |
4755 | { |
4756 | ProbedPage p[2],q; |
4757 | if (IS_PUSH_MODE(f)((f)->push_mode)) return error(f, VORBIS_invalid_api_mixing); |
4758 | |
4759 | // do we know the location of the last page? |
4760 | if (f->p_last.page_start == 0) { |
4761 | uint32 z = stb_vorbis_stream_length_in_samples(f); |
4762 | if (z == 0) return error(f, VORBIS_cant_find_last_page); |
4763 | } |
4764 | |
4765 | p[0] = f->p_first; |
4766 | p[1] = f->p_last; |
4767 | |
4768 | if (sample_number >= f->p_last.last_decoded_sample) |
4769 | sample_number = f->p_last.last_decoded_sample-1; |
4770 | |
4771 | if (sample_number < f->p_first.last_decoded_sample) { |
4772 | vorbis_seek_frame_from_page(f, p[0].page_start, 0, sample_number, fine); |
4773 | return 0; |
4774 | } else { |
4775 | int attempts=0; |
4776 | while (p[0].page_end < p[1].page_start) { |
4777 | uint32 probe; |
4778 | uint32 start_offset, end_offset; |
4779 | uint32 start_sample, end_sample; |
4780 | |
4781 | // copy these into local variables so we can tweak them |
4782 | // if any are unknown |
4783 | start_offset = p[0].page_end; |
4784 | end_offset = p[1].after_previous_page_start; // an address known to seek to page p[1] |
4785 | start_sample = p[0].last_decoded_sample; |
4786 | end_sample = p[1].last_decoded_sample; |
4787 | |
4788 | // currently there is no such tweaking logic needed/possible? |
4789 | if (start_sample == SAMPLE_unknown0xffffffff || end_sample == SAMPLE_unknown0xffffffff) |
4790 | return error(f, VORBIS_seek_failed); |
4791 | |
4792 | // now we want to lerp between these for the target samples... |
4793 | |
4794 | // step 1: we need to bias towards the page start... |
4795 | if (start_offset + 4000 < end_offset) |
4796 | end_offset -= 4000; |
4797 | |
4798 | // now compute an interpolated search loc |
4799 | probe = start_offset + (int) floor((float) (end_offset - start_offset) / (end_sample - start_sample) * (sample_number - start_sample)); |
4800 | |
4801 | // next we need to bias towards binary search... |
4802 | // code is a little wonky to allow for full 32-bit unsigned values |
4803 | if (attempts >= 4) { |
4804 | uint32 probe2 = start_offset + ((end_offset - start_offset) >> 1); |
4805 | if (attempts >= 8) |
4806 | probe = probe2; |
4807 | else if (probe < probe2) |
4808 | probe = probe + ((probe2 - probe) >> 1); |
4809 | else |
4810 | probe = probe2 + ((probe - probe2) >> 1); |
4811 | } |
4812 | ++attempts; |
4813 | |
4814 | set_file_offset(f, probe); |
4815 | if (!vorbis_find_page(f, NULL((void*)0), NULL((void*)0))) return error(f, VORBIS_seek_failed); |
4816 | if (!vorbis_analyze_page(f, &q)) return error(f, VORBIS_seek_failed); |
4817 | q.after_previous_page_start = probe; |
4818 | |
4819 | // it's possible we've just found the last page again |
4820 | if (q.page_start == p[1].page_start) { |
4821 | p[1] = q; |
4822 | continue; |
4823 | } |
4824 | |
4825 | if (sample_number < q.last_decoded_sample) |
4826 | p[1] = q; |
4827 | else |
4828 | p[0] = q; |
4829 | } |
4830 | |
4831 | if (p[0].last_decoded_sample <= sample_number && sample_number < p[1].last_decoded_sample) { |
4832 | vorbis_seek_frame_from_page(f, p[1].page_start, p[0].last_decoded_sample, sample_number, fine); |
4833 | return 0; |
4834 | } |
4835 | return error(f, VORBIS_seek_failed); |
4836 | } |
4837 | } |
4838 | |
4839 | int stb_vorbis_seek_frame(stb_vorbis *f, unsigned int sample_number) |
4840 | { |
4841 | return vorbis_seek_base(f, sample_number, FALSE0); |
4842 | } |
4843 | |
4844 | int stb_vorbis_seek(stb_vorbis *f, unsigned int sample_number) |
4845 | { |
4846 | return vorbis_seek_base(f, sample_number, TRUE1); |
4847 | } |
4848 | |
4849 | void stb_vorbis_seek_start(stb_vorbis *f) |
4850 | { |
4851 | if (IS_PUSH_MODE(f)((f)->push_mode)) { error(f, VORBIS_invalid_api_mixing); return; } |
4852 | set_file_offset(f, f->first_audio_page_offset); |
4853 | f->previous_length = 0; |
4854 | f->first_decode = TRUE1; |
4855 | f->next_seg = -1; |
4856 | vorbis_pump_first_frame(f); |
4857 | } |
4858 | |
4859 | unsigned int stb_vorbis_stream_length_in_samples(stb_vorbis *f) |
4860 | { |
4861 | unsigned int restore_offset, previous_safe; |
4862 | unsigned int end, last_page_loc; |
4863 | |
4864 | if (IS_PUSH_MODE(f)((f)->push_mode)) return error(f, VORBIS_invalid_api_mixing); |
4865 | if (!f->total_samples) { |
4866 | int last; |
4867 | uint32 lo,hi; |
4868 | char header[6]; |
4869 | |
4870 | // first, store the current decode position so we can restore it |
4871 | restore_offset = stb_vorbis_get_file_offset(f); |
4872 | |
4873 | // now we want to seek back 64K from the end (the last page must |
4874 | // be at most a little less than 64K, but let's allow a little slop) |
4875 | if (f->stream_len >= 65536 && f->stream_len-65536 >= f->first_audio_page_offset) |
4876 | previous_safe = f->stream_len - 65536; |
4877 | else |
4878 | previous_safe = f->first_audio_page_offset; |
4879 | |
4880 | set_file_offset(f, previous_safe); |
4881 | // previous_safe is now our candidate 'earliest known place that seeking |
4882 | // to will lead to the final page' |
4883 | |
4884 | if (!vorbis_find_page(f, &end, (int unsigned *)&last)) { |
4885 | // if we can't find a page, we're hosed! |
4886 | f->error = VORBIS_cant_find_last_page; |
4887 | f->total_samples = 0xffffffff; |
4888 | goto done; |
4889 | } |
4890 | |
4891 | // check if there are more pages |
4892 | last_page_loc = stb_vorbis_get_file_offset(f); |
4893 | |
4894 | // stop when the last_page flag is set, not when we reach eof; |
4895 | // this allows us to stop short of a 'file_section' end without |
4896 | // explicitly checking the length of the section |
4897 | while (!last) { |
4898 | set_file_offset(f, end); |
4899 | if (!vorbis_find_page(f, &end, (int unsigned *)&last)) { |
4900 | // the last page we found didn't have the 'last page' flag |
4901 | // set. whoops! |
4902 | break; |
4903 | } |
4904 | previous_safe = last_page_loc+1; |
4905 | last_page_loc = stb_vorbis_get_file_offset(f); |
4906 | } |
4907 | |
4908 | set_file_offset(f, last_page_loc); |
4909 | |
4910 | // parse the header |
4911 | getn(f, (unsigned char *)header, 6); |
4912 | // extract the absolute granule position |
4913 | lo = get32(f); |
4914 | hi = get32(f); |
4915 | if (lo == 0xffffffff && hi == 0xffffffff) { |
4916 | f->error = VORBIS_cant_find_last_page; |
4917 | f->total_samples = SAMPLE_unknown0xffffffff; |
4918 | goto done; |
4919 | } |
4920 | if (hi) |
4921 | lo = 0xfffffffe; // saturate |
4922 | f->total_samples = lo; |
4923 | |
4924 | f->p_last.page_start = last_page_loc; |
4925 | f->p_last.page_end = end; |
4926 | f->p_last.last_decoded_sample = lo; |
4927 | f->p_last.first_decoded_sample = SAMPLE_unknown0xffffffff; |
4928 | f->p_last.after_previous_page_start = previous_safe; |
4929 | |
4930 | done: |
4931 | set_file_offset(f, restore_offset); |
4932 | } |
4933 | return f->total_samples == SAMPLE_unknown0xffffffff ? 0 : f->total_samples; |
4934 | } |
4935 | |
4936 | float stb_vorbis_stream_length_in_seconds(stb_vorbis *f) |
4937 | { |
4938 | return stb_vorbis_stream_length_in_samples(f) / (float) f->sample_rate; |
4939 | } |
4940 | |
4941 | |
4942 | |
4943 | int stb_vorbis_get_frame_float(stb_vorbis *f, int *channels, float ***output) |
4944 | { |
4945 | int len, right,left,i; |
4946 | if (IS_PUSH_MODE(f)((f)->push_mode)) return error(f, VORBIS_invalid_api_mixing); |
4947 | |
4948 | if (!vorbis_decode_packet(f, &len, &left, &right)) { |
4949 | f->channel_buffer_start = f->channel_buffer_end = 0; |
4950 | return 0; |
4951 | } |
4952 | |
4953 | len = vorbis_finish_frame(f, len, left, right); |
4954 | for (i=0; i < f->channels; ++i) |
4955 | f->outputs[i] = f->channel_buffers[i] + left; |
4956 | |
4957 | f->channel_buffer_start = left; |
4958 | f->channel_buffer_end = left+len; |
4959 | |
4960 | if (channels) *channels = f->channels; |
4961 | if (output) *output = f->outputs; |
4962 | return len; |
4963 | } |
4964 | |
4965 | #ifndef STB_VORBIS_NO_STDIO |
4966 | |
4967 | stb_vorbis * stb_vorbis_open_file_section(FILE *file, int close_on_free, int *error, stb_vorbis_alloc *alloc, unsigned int length) |
4968 | { |
4969 | stb_vorbis *f, p; |
4970 | vorbis_init(&p, alloc); |
4971 | p.f = file; |
4972 | p.f_start = ftell(file); |
4973 | p.stream_len = length; |
4974 | p.close_on_free = close_on_free; |
4975 | if (start_decoder(&p)) { |
4976 | f = vorbis_alloc(&p); |
4977 | if (f) { |
4978 | *f = p; |
4979 | vorbis_pump_first_frame(f); |
4980 | return f; |
4981 | } |
4982 | } |
4983 | if (error) *error = p.error; |
4984 | vorbis_deinit(&p); |
4985 | return NULL((void*)0); |
4986 | } |
4987 | |
4988 | stb_vorbis * stb_vorbis_open_file(FILE *file, int close_on_free, int *error, stb_vorbis_alloc *alloc) |
4989 | { |
4990 | unsigned int len, start; |
4991 | start = ftell(file); |
4992 | fseek(file, 0, SEEK_END2); |
4993 | len = ftell(file) - start; |
4994 | fseek(file, start, SEEK_SET0); |
4995 | return stb_vorbis_open_file_section(file, close_on_free, error, alloc, len); |
4996 | } |
4997 | |
4998 | stb_vorbis * stb_vorbis_open_filename(char *filename, int *error, stb_vorbis_alloc *alloc) |
4999 | { |
5000 | FILE *f = fopen(filename, "rb"); |
5001 | if (f) |
5002 | return stb_vorbis_open_file(f, TRUE1, error, alloc); |
5003 | if (error) *error = VORBIS_file_open_failure; |
5004 | return NULL((void*)0); |
5005 | } |
5006 | #endif // STB_VORBIS_NO_STDIO |
5007 | |
5008 | stb_vorbis * stb_vorbis_open_memory(unsigned char *data, int len, int *error, stb_vorbis_alloc *alloc) |
5009 | { |
5010 | stb_vorbis *f, p; |
5011 | if (data == NULL((void*)0)) return NULL((void*)0); |
5012 | vorbis_init(&p, alloc); |
5013 | p.stream = data; |
5014 | p.stream_end = data + len; |
5015 | p.stream_start = p.stream; |
5016 | p.stream_len = len; |
5017 | p.push_mode = FALSE0; |
5018 | if (start_decoder(&p)) { |
5019 | f = vorbis_alloc(&p); |
5020 | if (f) { |
5021 | *f = p; |
5022 | vorbis_pump_first_frame(f); |
5023 | return f; |
5024 | } |
5025 | } |
5026 | if (error) *error = p.error; |
5027 | vorbis_deinit(&p); |
5028 | return NULL((void*)0); |
5029 | } |
5030 | |
5031 | #ifndef STB_VORBIS_NO_INTEGER_CONVERSION |
5032 | #define PLAYBACK_MONO1 1 |
5033 | #define PLAYBACK_LEFT2 2 |
5034 | #define PLAYBACK_RIGHT4 4 |
5035 | |
5036 | #define L(2 | 1) (PLAYBACK_LEFT2 | PLAYBACK_MONO1) |
5037 | #define C(2 | 4 | 1) (PLAYBACK_LEFT2 | PLAYBACK_RIGHT4 | PLAYBACK_MONO1) |
5038 | #define R(4 | 1) (PLAYBACK_RIGHT4 | PLAYBACK_MONO1) |
5039 | |
5040 | static int8 channel_position[7][6] = |
5041 | { |
5042 | { 0 }, |
5043 | { C(2 | 4 | 1) }, |
5044 | { L(2 | 1), R(4 | 1) }, |
5045 | { L(2 | 1), C(2 | 4 | 1), R(4 | 1) }, |
5046 | { L(2 | 1), R(4 | 1), L(2 | 1), R(4 | 1) }, |
5047 | { L(2 | 1), C(2 | 4 | 1), R(4 | 1), L(2 | 1), R(4 | 1) }, |
5048 | { L(2 | 1), C(2 | 4 | 1), R(4 | 1), L(2 | 1), R(4 | 1), C(2 | 4 | 1) }, |
5049 | }; |
5050 | |
5051 | |
5052 | #ifndef STB_VORBIS_NO_FAST_SCALED_FLOAT |
5053 | typedef union { |
5054 | float f; |
5055 | int i; |
5056 | } float_conv; |
5057 | typedef char stb_vorbis_float_size_test[sizeof(float)==4 && sizeof(int) == 4]; |
5058 | #define FASTDEF(x)float_conv x float_conv x |
5059 | // add (1<<23) to convert to int, then divide by 2^SHIFT, then add 0.5/2^SHIFT to round |
5060 | #define MAGIC(SHIFT)(1.5f * (1 << (23-SHIFT)) + 0.5f/(1 << SHIFT)) (1.5f * (1 << (23-SHIFT)) + 0.5f/(1 << SHIFT)) |
5061 | #define ADDEND(SHIFT)(((150-SHIFT) << 23) + (1 << 22)) (((150-SHIFT) << 23) + (1 << 22)) |
5062 | #define FAST_SCALED_FLOAT_TO_INT(temp,x,s)(temp.f = (x) + (1.5f * (1 << (23-s)) + 0.5f/(1 << s)), temp.i - (((150-s) << 23) + (1 << 22))) (temp.f = (x) + MAGIC(s)(1.5f * (1 << (23-s)) + 0.5f/(1 << s)), temp.i - ADDEND(s)(((150-s) << 23) + (1 << 22))) |
5063 | #define check_endianness() |
5064 | #else |
5065 | #define FAST_SCALED_FLOAT_TO_INT(temp,x,s)(temp.f = (x) + (1.5f * (1 << (23-s)) + 0.5f/(1 << s)), temp.i - (((150-s) << 23) + (1 << 22))) ((int) ((x) * (1 << (s)))) |
5066 | #define check_endianness() |
5067 | #define FASTDEF(x)float_conv x |
5068 | #endif |
5069 | |
5070 | static void copy_samples(short *dest, float *src, int len) |
5071 | { |
5072 | int i; |
5073 | check_endianness(); |
5074 | for (i=0; i < len; ++i) { |
5075 | FASTDEF(temp)float_conv temp; |
5076 | int v = FAST_SCALED_FLOAT_TO_INT(temp, src[i],15)(temp.f = (src[i]) + (1.5f * (1 << (23-15)) + 0.5f/(1 << 15)), temp.i - (((150-15) << 23) + (1 << 22))); |
5077 | if ((unsigned int) (v + 32768) > 65535) |
5078 | v = v < 0 ? -32768 : 32767; |
5079 | dest[i] = v; |
5080 | } |
5081 | } |
5082 | |
5083 | static void compute_samples(int mask, short *output, int num_c, float **data, int d_offset, int len) |
5084 | { |
5085 | #define BUFFER_SIZE32 32 |
5086 | float buffer[BUFFER_SIZE32]; |
5087 | int i,j,o,n = BUFFER_SIZE32; |
5088 | check_endianness(); |
5089 | for (o = 0; o < len; o += BUFFER_SIZE32) { |
5090 | memset(buffer, 0, sizeof(buffer)); |
5091 | if (o + n > len) n = len - o; |
5092 | for (j=0; j < num_c; ++j) { |
5093 | if (channel_position[num_c][j] & mask) { |
5094 | for (i=0; i < n; ++i) |
5095 | buffer[i] += data[j][d_offset+o+i]; |
5096 | } |
5097 | } |
5098 | for (i=0; i < n; ++i) { |
5099 | FASTDEF(temp)float_conv temp; |
5100 | int v = FAST_SCALED_FLOAT_TO_INT(temp,buffer[i],15)(temp.f = (buffer[i]) + (1.5f * (1 << (23-15)) + 0.5f/( 1 << 15)), temp.i - (((150-15) << 23) + (1 << 22))); |
5101 | if ((unsigned int) (v + 32768) > 65535) |
5102 | v = v < 0 ? -32768 : 32767; |
5103 | output[o+i] = v; |
5104 | } |
5105 | } |
5106 | } |
5107 | |
5108 | static int channel_selector[3][2] = { {0}, {PLAYBACK_MONO1}, {PLAYBACK_LEFT2, PLAYBACK_RIGHT4} }; |
5109 | static void compute_stereo_samples(short *output, int num_c, float **data, int d_offset, int len) |
5110 | { |
5111 | #define BUFFER_SIZE32 32 |
5112 | float buffer[BUFFER_SIZE32]; |
5113 | int i,j,o,n = BUFFER_SIZE32 >> 1; |
5114 | // o is the offset in the source data |
5115 | check_endianness(); |
5116 | for (o = 0; o < len; o += BUFFER_SIZE32 >> 1) { |
5117 | // o2 is the offset in the output data |
5118 | int o2 = o << 1; |
5119 | memset(buffer, 0, sizeof(buffer)); |
5120 | if (o + n > len) n = len - o; |
5121 | for (j=0; j < num_c; ++j) { |
5122 | int m = channel_position[num_c][j] & (PLAYBACK_LEFT2 | PLAYBACK_RIGHT4); |
5123 | if (m == (PLAYBACK_LEFT2 | PLAYBACK_RIGHT4)) { |
5124 | for (i=0; i < n; ++i) { |
5125 | buffer[i*2+0] += data[j][d_offset+o+i]; |
5126 | buffer[i*2+1] += data[j][d_offset+o+i]; |
5127 | } |
5128 | } else if (m == PLAYBACK_LEFT2) { |
5129 | for (i=0; i < n; ++i) { |
5130 | buffer[i*2+0] += data[j][d_offset+o+i]; |
5131 | } |
5132 | } else if (m == PLAYBACK_RIGHT4) { |
5133 | for (i=0; i < n; ++i) { |
5134 | buffer[i*2+1] += data[j][d_offset+o+i]; |
5135 | } |
5136 | } |
5137 | } |
5138 | for (i=0; i < (n<<1); ++i) { |
5139 | FASTDEF(temp)float_conv temp; |
5140 | int v = FAST_SCALED_FLOAT_TO_INT(temp,buffer[i],15)(temp.f = (buffer[i]) + (1.5f * (1 << (23-15)) + 0.5f/( 1 << 15)), temp.i - (((150-15) << 23) + (1 << 22))); |
5141 | if ((unsigned int) (v + 32768) > 65535) |
5142 | v = v < 0 ? -32768 : 32767; |
5143 | output[o2+i] = v; |
5144 | } |
5145 | } |
5146 | } |
5147 | |
5148 | static void convert_samples_short(int buf_c, short **buffer, int b_offset, int data_c, float **data, int d_offset, int samples) |
5149 | { |
5150 | int i; |
5151 | if (buf_c != data_c && buf_c <= 2 && data_c <= 6) { |
5152 | static int channel_selector[3][2] = { {0}, {PLAYBACK_MONO1}, {PLAYBACK_LEFT2, PLAYBACK_RIGHT4} }; |
5153 | for (i=0; i < buf_c; ++i) |
5154 | compute_samples(channel_selector[buf_c][i], buffer[i]+b_offset, data_c, data, d_offset, samples); |
5155 | } else { |
5156 | int limit = buf_c < data_c ? buf_c : data_c; |
5157 | for (i=0; i < limit; ++i) |
5158 | copy_samples(buffer[i]+b_offset, data[i], samples); |
5159 | for ( ; i < buf_c; ++i) |
5160 | memset(buffer[i]+b_offset, 0, sizeof(short) * samples); |
5161 | } |
5162 | } |
5163 | |
5164 | int stb_vorbis_get_frame_short(stb_vorbis *f, int num_c, short **buffer, int num_samples) |
5165 | { |
5166 | float **output; |
5167 | int len = stb_vorbis_get_frame_float(f, NULL((void*)0), &output); |
5168 | if (len > num_samples) len = num_samples; |
5169 | if (len) |
5170 | convert_samples_short(num_c, buffer, 0, f->channels, output, 0, len); |
5171 | return len; |
5172 | } |
5173 | |
5174 | static void convert_channels_short_interleaved(int buf_c, short *buffer, int data_c, float **data, int d_offset, int len) |
5175 | { |
5176 | int i; |
5177 | check_endianness(); |
5178 | if (buf_c != data_c && buf_c <= 2 && data_c <= 6) { |
5179 | assert(buf_c == 2)((buf_c == 2) ? (void)0 : _assert("buf_c == 2", "src/siege/internal/stb/stb_vorbis.c" , 5179)); |
5180 | for (i=0; i < buf_c; ++i) |
5181 | compute_stereo_samples(buffer, data_c, data, d_offset, len); |
5182 | } else { |
5183 | int limit = buf_c < data_c ? buf_c : data_c; |
5184 | int j; |
5185 | for (j=0; j < len; ++j) { |
5186 | for (i=0; i < limit; ++i) { |
5187 | FASTDEF(temp)float_conv temp; |
5188 | float f = data[i][d_offset+j]; |
5189 | int v = FAST_SCALED_FLOAT_TO_INT(temp, f,15)(temp.f = (f) + (1.5f * (1 << (23-15)) + 0.5f/(1 << 15)), temp.i - (((150-15) << 23) + (1 << 22)));//data[i][d_offset+j],15); |
5190 | if ((unsigned int) (v + 32768) > 65535) |
5191 | v = v < 0 ? -32768 : 32767; |
5192 | *buffer++ = v; |
5193 | } |
5194 | for ( ; i < buf_c; ++i) |
5195 | *buffer++ = 0; |
5196 | } |
5197 | } |
5198 | } |
5199 | |
5200 | int stb_vorbis_get_frame_short_interleaved(stb_vorbis *f, int num_c, short *buffer, int num_shorts) |
5201 | { |
5202 | float **output; |
5203 | int len; |
5204 | if (num_c == 1) return stb_vorbis_get_frame_short(f,num_c,&buffer, num_shorts); |
5205 | len = stb_vorbis_get_frame_float(f, NULL((void*)0), &output); |
5206 | if (len) { |
5207 | if (len*num_c > num_shorts) len = num_shorts / num_c; |
5208 | convert_channels_short_interleaved(num_c, buffer, f->channels, output, 0, len); |
5209 | } |
5210 | return len; |
5211 | } |
5212 | |
5213 | int stb_vorbis_get_samples_short_interleaved(stb_vorbis *f, int channels, short *buffer, int num_shorts) |
5214 | { |
5215 | float **outputs; |
5216 | int len = num_shorts / channels; |
5217 | int n=0; |
5218 | int z = f->channels; |
5219 | if (z > channels) z = channels; |
5220 | while (n < len) { |
5221 | int k = f->channel_buffer_end - f->channel_buffer_start; |
5222 | if (n+k >= len) k = len - n; |
5223 | if (k) |
5224 | convert_channels_short_interleaved(channels, buffer, f->channels, f->channel_buffers, f->channel_buffer_start, k); |
5225 | buffer += k*channels; |
5226 | n += k; |
5227 | f->channel_buffer_start += k; |
5228 | if (n == len) break; |
5229 | if (!stb_vorbis_get_frame_float(f, NULL((void*)0), &outputs)) break; |
5230 | } |
5231 | return n; |
5232 | } |
5233 | |
5234 | int stb_vorbis_get_samples_short(stb_vorbis *f, int channels, short **buffer, int len) |
5235 | { |
5236 | float **outputs; |
5237 | int n=0; |
5238 | int z = f->channels; |
5239 | if (z > channels) z = channels; |
Value stored to 'z' is never read | |
5240 | while (n < len) { |
5241 | int k = f->channel_buffer_end - f->channel_buffer_start; |
5242 | if (n+k >= len) k = len - n; |
5243 | if (k) |
5244 | convert_samples_short(channels, buffer, n, f->channels, f->channel_buffers, f->channel_buffer_start, k); |
5245 | n += k; |
5246 | f->channel_buffer_start += k; |
5247 | if (n == len) break; |
5248 | if (!stb_vorbis_get_frame_float(f, NULL((void*)0), &outputs)) break; |
5249 | } |
5250 | return n; |
5251 | } |
5252 | |
5253 | #ifndef STB_VORBIS_NO_STDIO |
5254 | int stb_vorbis_decode_filename(char *filename, int *channels, short **output) |
5255 | { |
5256 | int data_len, offset, total, limit, error; |
5257 | short *data; |
5258 | stb_vorbis *v = stb_vorbis_open_filename(filename, &error, NULL((void*)0)); |
5259 | if (v == NULL((void*)0)) return -1; |
5260 | limit = v->channels * 4096; |
5261 | *channels = v->channels; |
5262 | offset = data_len = 0; |
5263 | total = limit; |
5264 | data = (short *) malloc(total * sizeof(*data)); |
5265 | if (data == NULL((void*)0)) { |
5266 | stb_vorbis_close(v); |
5267 | return -2; |
5268 | } |
5269 | for (;;) { |
5270 | int n = stb_vorbis_get_frame_short_interleaved(v, v->channels, data+offset, total-offset); |
5271 | if (n == 0) break; |
5272 | data_len += n; |
5273 | offset += n * v->channels; |
5274 | if (offset + limit > total) { |
5275 | short *data2; |
5276 | total *= 2; |
5277 | data2 = (short *) realloc(data, total * sizeof(*data)); |
5278 | if (data2 == NULL((void*)0)) { |
5279 | free(data); |
5280 | stb_vorbis_close(v); |
5281 | return -2; |
5282 | } |
5283 | data = data2; |
5284 | } |
5285 | } |
5286 | *output = data; |
5287 | return data_len; |
5288 | } |
5289 | #endif // NO_STDIO |
5290 | |
5291 | int stb_vorbis_decode_memory(uint8 *mem, int len, int *channels, short **output) |
5292 | { |
5293 | int data_len, offset, total, limit, error; |
5294 | short *data; |
5295 | stb_vorbis *v = stb_vorbis_open_memory(mem, len, &error, NULL((void*)0)); |
5296 | if (v == NULL((void*)0)) return -1; |
5297 | limit = v->channels * 4096; |
5298 | *channels = v->channels; |
5299 | offset = data_len = 0; |
5300 | total = limit; |
5301 | data = (short *) malloc(total * sizeof(*data)); |
5302 | if (data == NULL((void*)0)) { |
5303 | stb_vorbis_close(v); |
5304 | return -2; |
5305 | } |
5306 | for (;;) { |
5307 | int n = stb_vorbis_get_frame_short_interleaved(v, v->channels, data+offset, total-offset); |
5308 | if (n == 0) break; |
5309 | data_len += n; |
5310 | offset += n * v->channels; |
5311 | if (offset + limit > total) { |
5312 | short *data2; |
5313 | total *= 2; |
5314 | data2 = (short *) realloc(data, total * sizeof(*data)); |
5315 | if (data2 == NULL((void*)0)) { |
5316 | free(data); |
5317 | stb_vorbis_close(v); |
5318 | return -2; |
5319 | } |
5320 | data = data2; |
5321 | } |
5322 | } |
5323 | *output = data; |
5324 | return data_len; |
5325 | } |
5326 | #endif |
5327 | |
5328 | int stb_vorbis_get_samples_float_interleaved(stb_vorbis *f, int channels, float *buffer, int num_floats) |
5329 | { |
5330 | float **outputs; |
5331 | int len = num_floats / channels; |
5332 | int n=0; |
5333 | int z = f->channels; |
5334 | if (z > channels) z = channels; |
5335 | while (n < len) { |
5336 | int i,j; |
5337 | int k = f->channel_buffer_end - f->channel_buffer_start; |
5338 | if (n+k >= len) k = len - n; |
5339 | for (j=0; j < k; ++j) { |
5340 | for (i=0; i < z; ++i) |
5341 | *buffer++ = f->channel_buffers[i][f->channel_buffer_start+j]; |
5342 | for ( ; i < channels; ++i) |
5343 | *buffer++ = 0; |
5344 | } |
5345 | n += k; |
5346 | f->channel_buffer_start += k; |
5347 | if (n == len) break; |
5348 | if (!stb_vorbis_get_frame_float(f, NULL((void*)0), &outputs)) break; |
5349 | } |
5350 | return n; |
5351 | } |
5352 | |
5353 | int stb_vorbis_get_samples_float(stb_vorbis *f, int channels, float **buffer, int num_samples) |
5354 | { |
5355 | float **outputs; |
5356 | int n=0; |
5357 | int z = f->channels; |
5358 | if (z > channels) z = channels; |
5359 | while (n < num_samples) { |
5360 | int i; |
5361 | int k = f->channel_buffer_end - f->channel_buffer_start; |
5362 | if (n+k >= num_samples) k = num_samples - n; |
5363 | if (k) { |
5364 | for (i=0; i < z; ++i) |
5365 | memcpy(buffer[i]+n, f->channel_buffers+f->channel_buffer_start, sizeof(float)*k); |
5366 | for ( ; i < channels; ++i) |
5367 | memset(buffer[i]+n, 0, sizeof(float) * k); |
5368 | } |
5369 | n += k; |
5370 | f->channel_buffer_start += k; |
5371 | if (n == num_samples) break; |
5372 | if (!stb_vorbis_get_frame_float(f, NULL((void*)0), &outputs)) break; |
5373 | } |
5374 | return n; |
5375 | } |
5376 | #endif // STB_VORBIS_NO_PULLDATA_API |
5377 | |
5378 | void _dummyFunction(void) |
5379 | { |
5380 | (void)get_bits_signed; |
5381 | (void)codebook_decode_scalar; |
5382 | (void)channel_selector; |
5383 | } |
5384 | |
5385 | #endif // STB_VORBIS_HEADER_ONLY |