- speed up decoding
- CFLAGS cleanup
This commit is contained in:
parent
330b9804c0
commit
66a59af0bd
@ -20,18 +20,17 @@ diff -up flac-1.2.1/src/libFLAC/ia32/lpc_asm.nasm.asm flac-1.2.1/src/libFLAC/ia3
|
||||
- section .note.GNU-stack noalloc
|
||||
+ section .note.GNU-stack progbits noalloc noexec nowrite align=1
|
||||
%endif
|
||||
diff -up flac-1.2.1/src/libFLAC/ia32/Makefile.in.asm flac-1.2.1/src/libFLAC/ia32/Makefile.in
|
||||
--- flac-1.2.1/src/libFLAC/ia32/Makefile.in.asm 2007-09-16 22:05:12.000000000 +0200
|
||||
+++ flac-1.2.1/src/libFLAC/ia32/Makefile.in 2008-01-29 10:32:17.000000000 +0100
|
||||
@@ -254,7 +254,7 @@ LTLIBRARIES = $(noinst_LTLIBRARIES)
|
||||
|
||||
libFLAC_asm_la_LDFLAGS =
|
||||
libFLAC_asm_la_LIBADD =
|
||||
-am_libFLAC_asm_la_OBJECTS = bitreader_asm.lo cpu_asm.lo fixed_asm.lo \
|
||||
+am_libFLAC_asm_la_OBJECTS = cpu_asm.lo fixed_asm.lo \
|
||||
lpc_asm.lo stream_encoder_asm.lo
|
||||
libFLAC_asm_la_OBJECTS = $(am_libFLAC_asm_la_OBJECTS)
|
||||
diff -up flac-1.2.1/src/libFLAC/ia32/Makefile.am.asm flac-1.2.1/src/libFLAC/ia32/Makefile.am
|
||||
--- flac-1.2.1/src/libFLAC/ia32/Makefile.am.asm 2007-04-04 02:01:13.000000000 +0200
|
||||
+++ flac-1.2.1/src/libFLAC/ia32/Makefile.am 2008-03-17 14:04:37.000000000 +0100
|
||||
@@ -37,7 +37,6 @@ STRIP_NON_ASM = sh $(top_srcdir)/strip_n
|
||||
|
||||
noinst_LTLIBRARIES = libFLAC-asm.la
|
||||
libFLAC_asm_la_SOURCES = \
|
||||
- bitreader_asm.nasm \
|
||||
cpu_asm.nasm \
|
||||
fixed_asm.nasm \
|
||||
lpc_asm.nasm \
|
||||
diff -up flac-1.2.1/src/libFLAC/ia32/bitreader_asm.nasm.asm flac-1.2.1/src/libFLAC/ia32/bitreader_asm.nasm
|
||||
--- flac-1.2.1/src/libFLAC/ia32/bitreader_asm.nasm.asm 2007-03-30 02:54:53.000000000 +0200
|
||||
+++ flac-1.2.1/src/libFLAC/ia32/bitreader_asm.nasm 2008-01-29 10:32:57.000000000 +0100
|
||||
|
558
flac-1.2.1-bitreader.patch
Normal file
558
flac-1.2.1-bitreader.patch
Normal file
@ -0,0 +1,558 @@
|
||||
Index: src/libFLAC/bitreader.c
|
||||
===================================================================
|
||||
RCS file: /cvsroot/flac/flac/src/libFLAC/bitreader.c,v
|
||||
retrieving revision 1.15
|
||||
diff -u -r1.15 bitreader.c
|
||||
--- src/libFLAC/bitreader.c 28 Feb 2008 05:34:26 -0000 1.15
|
||||
+++ src/libFLAC/bitreader.c 14 Mar 2008 11:07:07 -0000
|
||||
@@ -69,13 +69,12 @@
|
||||
#endif
|
||||
/* counts the # of zero MSBs in a word */
|
||||
#define COUNT_ZERO_MSBS(word) ( \
|
||||
- (word) <= 0xffff ? \
|
||||
- ( (word) <= 0xff? byte_to_unary_table[word] + 24 : byte_to_unary_table[(word) >> 8] + 16 ) : \
|
||||
- ( (word) <= 0xffffff? byte_to_unary_table[word >> 16] + 8 : byte_to_unary_table[(word) >> 24] ) \
|
||||
+ word > 0xffffff ? byte_to_unary_table[(word) >> 24] : \
|
||||
+ !word ? 32 : \
|
||||
+ word > 0xffff ? byte_to_unary_table[word >> 16] + 8 : \
|
||||
+ word > 0xff ? byte_to_unary_table[(word) >> 8] + 16 : \
|
||||
+ byte_to_unary_table[word] + 24 \
|
||||
)
|
||||
-/* this alternate might be slightly faster on some systems/compilers: */
|
||||
-#define COUNT_ZERO_MSBS2(word) ( (word) <= 0xff ? byte_to_unary_table[word] + 24 : ((word) <= 0xffff ? byte_to_unary_table[(word) >> 8] + 16 : ((word) <= 0xffffff ? byte_to_unary_table[(word) >> 16] + 8 : byte_to_unary_table[(word) >> 24])) )
|
||||
-
|
||||
|
||||
/*
|
||||
* This should be at least twice as large as the largest number of words
|
||||
Index: src/libFLAC/bitreader.c
|
||||
===================================================================
|
||||
RCS file: /cvsroot/flac/flac/src/libFLAC/bitreader.c,v
|
||||
retrieving revision 1.15
|
||||
diff -u -r1.15 bitreader.c
|
||||
--- src/libFLAC/bitreader.c 28 Feb 2008 05:34:26 -0000 1.15
|
||||
+++ src/libFLAC/bitreader.c 14 Mar 2008 13:19:46 -0000
|
||||
@@ -149,6 +148,7 @@
|
||||
FLAC__CPUInfo cpu_info;
|
||||
};
|
||||
|
||||
+#if FLAC__BYTES_PER_WORD == 4 && FLAC__CPU_IA32
|
||||
#ifdef _MSC_VER
|
||||
/* OPT: an MSVC built-in would be better */
|
||||
static _inline FLAC__uint32 local_swap32_(FLAC__uint32 x)
|
||||
@@ -173,6 +173,15 @@
|
||||
done1:
|
||||
}
|
||||
}
|
||||
+#elif __GNUC__
|
||||
+static void local_swap32_block_(FLAC__uint32 *start, FLAC__uint32 len)
|
||||
+{
|
||||
+ FLAC__uint32 *end;
|
||||
+
|
||||
+ for(end = start + len; start < end; start++)
|
||||
+ asm ("bswap %0" : "=r"(*start) : "0"(*start));
|
||||
+}
|
||||
+#endif
|
||||
#endif
|
||||
|
||||
static FLaC__INLINE void crc16_update_word_(FLAC__BitReader *br, brword word)
|
||||
@@ -263,7 +272,7 @@
|
||||
#if WORDS_BIGENDIAN
|
||||
#else
|
||||
end = (br->words*FLAC__BYTES_PER_WORD + br->bytes + bytes + (FLAC__BYTES_PER_WORD-1)) / FLAC__BYTES_PER_WORD;
|
||||
-# if defined(_MSC_VER) && (FLAC__BYTES_PER_WORD == 4)
|
||||
+# if FLAC__CPU_IA32 && (__GNUC__ || defined(_MSC_VER)) && FLAC__BYTES_PER_WORD == 4
|
||||
if(br->cpu_info.type == FLAC__CPUINFO_TYPE_IA32 && br->cpu_info.data.ia32.bswap) {
|
||||
start = br->words;
|
||||
local_swap32_block_(br->buffer + start, end - start);
|
||||
Index: src/libFLAC/bitreader.c
|
||||
===================================================================
|
||||
RCS file: /cvsroot/flac/flac/src/libFLAC/bitreader.c,v
|
||||
retrieving revision 1.15
|
||||
diff -u -r1.15 bitreader.c
|
||||
--- src/libFLAC/bitreader.c 28 Feb 2008 05:34:26 -0000 1.15
|
||||
+++ src/libFLAC/bitreader.c 17 Mar 2008 15:42:57 -0000
|
||||
@@ -803,379 +812,144 @@
|
||||
}
|
||||
|
||||
/* this is by far the most heavily used reader call. it ain't pretty but it's fast */
|
||||
-/* a lot of the logic is copied, then adapted, from FLAC__bitreader_read_unary_unsigned() and FLAC__bitreader_read_raw_uint32() */
|
||||
FLAC__bool FLAC__bitreader_read_rice_signed_block(FLAC__BitReader *br, int vals[], unsigned nvals, unsigned parameter)
|
||||
-/* OPT: possibly faster version for use with MSVC */
|
||||
-#ifdef _MSC_VER
|
||||
{
|
||||
- unsigned i;
|
||||
- unsigned uval = 0;
|
||||
- unsigned bits; /* the # of binary LSBs left to read to finish a rice codeword */
|
||||
-
|
||||
/* try and get br->consumed_words and br->consumed_bits into register;
|
||||
* must remember to flush them back to *br before calling other
|
||||
- * bitwriter functions that use them, and before returning */
|
||||
- register unsigned cwords;
|
||||
- register unsigned cbits;
|
||||
+ * bitreader functions that use them, and before returning */
|
||||
+ unsigned cwords, words, lsbs, msbs, x, y;
|
||||
+ unsigned ucbits; /* keep track of the number of unconsumed bits in word */
|
||||
+ brword b;
|
||||
+ int *val, *end;
|
||||
|
||||
FLAC__ASSERT(0 != br);
|
||||
FLAC__ASSERT(0 != br->buffer);
|
||||
/* WATCHOUT: code does not work with <32bit words; we can make things much faster with this assertion */
|
||||
FLAC__ASSERT(FLAC__BITS_PER_WORD >= 32);
|
||||
FLAC__ASSERT(parameter < 32);
|
||||
- /* the above two asserts also guarantee that the binary part never straddles more that 2 words, so we don't have to loop to read it */
|
||||
-
|
||||
- if(nvals == 0)
|
||||
- return true;
|
||||
-
|
||||
- cbits = br->consumed_bits;
|
||||
- cwords = br->consumed_words;
|
||||
+ /* the above two asserts also guarantee that the binary part never straddles more than 2 words, so we don't have to loop to read it */
|
||||
|
||||
- while(1) {
|
||||
+ val = vals;
|
||||
+ end = vals + nvals;
|
||||
|
||||
- /* read unary part */
|
||||
- while(1) {
|
||||
- while(cwords < br->words) { /* if we've not consumed up to a partial tail word... */
|
||||
- brword b = br->buffer[cwords] << cbits;
|
||||
- if(b) {
|
||||
-#if 0 /* slower, probably due to bad register allocation... */ && defined FLAC__CPU_IA32 && !defined FLAC__NO_ASM && FLAC__BITS_PER_WORD == 32
|
||||
- __asm {
|
||||
- bsr eax, b
|
||||
- not eax
|
||||
- and eax, 31
|
||||
- mov i, eax
|
||||
- }
|
||||
-#else
|
||||
- i = COUNT_ZERO_MSBS(b);
|
||||
-#endif
|
||||
- uval += i;
|
||||
- bits = parameter;
|
||||
- i++;
|
||||
- cbits += i;
|
||||
- if(cbits == FLAC__BITS_PER_WORD) {
|
||||
- crc16_update_word_(br, br->buffer[cwords]);
|
||||
- cwords++;
|
||||
- cbits = 0;
|
||||
- }
|
||||
- goto break1;
|
||||
- }
|
||||
- else {
|
||||
- uval += FLAC__BITS_PER_WORD - cbits;
|
||||
- crc16_update_word_(br, br->buffer[cwords]);
|
||||
- cwords++;
|
||||
- cbits = 0;
|
||||
- /* didn't find stop bit yet, have to keep going... */
|
||||
- }
|
||||
- }
|
||||
- /* at this point we've eaten up all the whole words; have to try
|
||||
- * reading through any tail bytes before calling the read callback.
|
||||
- * this is a repeat of the above logic adjusted for the fact we
|
||||
- * don't have a whole word. note though if the client is feeding
|
||||
- * us data a byte at a time (unlikely), br->consumed_bits may not
|
||||
- * be zero.
|
||||
- */
|
||||
- if(br->bytes) {
|
||||
- const unsigned end = br->bytes * 8;
|
||||
- brword b = (br->buffer[cwords] & (FLAC__WORD_ALL_ONES << (FLAC__BITS_PER_WORD-end))) << cbits;
|
||||
- if(b) {
|
||||
- i = COUNT_ZERO_MSBS(b);
|
||||
- uval += i;
|
||||
- bits = parameter;
|
||||
- i++;
|
||||
- cbits += i;
|
||||
- FLAC__ASSERT(cbits < FLAC__BITS_PER_WORD);
|
||||
- goto break1;
|
||||
- }
|
||||
- else {
|
||||
- uval += end - cbits;
|
||||
- cbits += end;
|
||||
- FLAC__ASSERT(cbits < FLAC__BITS_PER_WORD);
|
||||
- /* didn't find stop bit yet, have to keep going... */
|
||||
- }
|
||||
- }
|
||||
- /* flush registers and read; bitreader_read_from_client_() does
|
||||
- * not touch br->consumed_bits at all but we still need to set
|
||||
- * it in case it fails and we have to return false.
|
||||
- */
|
||||
- br->consumed_bits = cbits;
|
||||
- br->consumed_words = cwords;
|
||||
- if(!bitreader_read_from_client_(br))
|
||||
+ if(parameter == 0) {
|
||||
+ while(val < end) {
|
||||
+ /* read the unary MSBs and end bit */
|
||||
+ if(!FLAC__bitreader_read_unary_unsigned(br, &msbs))
|
||||
return false;
|
||||
- cwords = br->consumed_words;
|
||||
- }
|
||||
-break1:
|
||||
- /* read binary part */
|
||||
- FLAC__ASSERT(cwords <= br->words);
|
||||
-
|
||||
- if(bits) {
|
||||
- while((br->words-cwords)*FLAC__BITS_PER_WORD + br->bytes*8 - cbits < bits) {
|
||||
- /* flush registers and read; bitreader_read_from_client_() does
|
||||
- * not touch br->consumed_bits at all but we still need to set
|
||||
- * it in case it fails and we have to return false.
|
||||
- */
|
||||
- br->consumed_bits = cbits;
|
||||
- br->consumed_words = cwords;
|
||||
- if(!bitreader_read_from_client_(br))
|
||||
- return false;
|
||||
- cwords = br->consumed_words;
|
||||
- }
|
||||
- if(cwords < br->words) { /* if we've not consumed up to a partial tail word... */
|
||||
- if(cbits) {
|
||||
- /* this also works when consumed_bits==0, it's just a little slower than necessary for that case */
|
||||
- const unsigned n = FLAC__BITS_PER_WORD - cbits;
|
||||
- const brword word = br->buffer[cwords];
|
||||
- if(bits < n) {
|
||||
- uval <<= bits;
|
||||
- uval |= (word & (FLAC__WORD_ALL_ONES >> cbits)) >> (n-bits);
|
||||
- cbits += bits;
|
||||
- goto break2;
|
||||
- }
|
||||
- uval <<= n;
|
||||
- uval |= word & (FLAC__WORD_ALL_ONES >> cbits);
|
||||
- bits -= n;
|
||||
- crc16_update_word_(br, word);
|
||||
- cwords++;
|
||||
- cbits = 0;
|
||||
- if(bits) { /* if there are still bits left to read, there have to be less than 32 so they will all be in the next word */
|
||||
- uval <<= bits;
|
||||
- uval |= (br->buffer[cwords] >> (FLAC__BITS_PER_WORD-bits));
|
||||
- cbits = bits;
|
||||
- }
|
||||
- goto break2;
|
||||
- }
|
||||
- else {
|
||||
- FLAC__ASSERT(bits < FLAC__BITS_PER_WORD);
|
||||
- uval <<= bits;
|
||||
- uval |= br->buffer[cwords] >> (FLAC__BITS_PER_WORD-bits);
|
||||
- cbits = bits;
|
||||
- goto break2;
|
||||
- }
|
||||
- }
|
||||
- else {
|
||||
- /* in this case we're starting our read at a partial tail word;
|
||||
- * the reader has guaranteed that we have at least 'bits' bits
|
||||
- * available to read, which makes this case simpler.
|
||||
- */
|
||||
- uval <<= bits;
|
||||
- if(cbits) {
|
||||
- /* this also works when consumed_bits==0, it's just a little slower than necessary for that case */
|
||||
- FLAC__ASSERT(cbits + bits <= br->bytes*8);
|
||||
- uval |= (br->buffer[cwords] & (FLAC__WORD_ALL_ONES >> cbits)) >> (FLAC__BITS_PER_WORD-cbits-bits);
|
||||
- cbits += bits;
|
||||
- goto break2;
|
||||
- }
|
||||
- else {
|
||||
- uval |= br->buffer[cwords] >> (FLAC__BITS_PER_WORD-bits);
|
||||
- cbits += bits;
|
||||
- goto break2;
|
||||
- }
|
||||
- }
|
||||
- }
|
||||
-break2:
|
||||
- /* compose the value */
|
||||
- *vals = (int)(uval >> 1 ^ -(int)(uval & 1));
|
||||
|
||||
- /* are we done? */
|
||||
- --nvals;
|
||||
- if(nvals == 0) {
|
||||
- br->consumed_bits = cbits;
|
||||
- br->consumed_words = cwords;
|
||||
- return true;
|
||||
+ *val++ = (int)(msbs >> 1) ^ -(int)(msbs & 1);
|
||||
}
|
||||
|
||||
- uval = 0;
|
||||
- ++vals;
|
||||
-
|
||||
+ return true;
|
||||
}
|
||||
-}
|
||||
-#else
|
||||
-{
|
||||
- unsigned i;
|
||||
- unsigned uval = 0;
|
||||
|
||||
- /* try and get br->consumed_words and br->consumed_bits into register;
|
||||
- * must remember to flush them back to *br before calling other
|
||||
- * bitwriter functions that use them, and before returning */
|
||||
- register unsigned cwords;
|
||||
- register unsigned cbits;
|
||||
- unsigned ucbits; /* keep track of the number of unconsumed bits in the buffer */
|
||||
+ FLAC__ASSERT(parameter > 0);
|
||||
|
||||
- FLAC__ASSERT(0 != br);
|
||||
- FLAC__ASSERT(0 != br->buffer);
|
||||
- /* WATCHOUT: code does not work with <32bit words; we can make things much faster with this assertion */
|
||||
- FLAC__ASSERT(FLAC__BITS_PER_WORD >= 32);
|
||||
- FLAC__ASSERT(parameter < 32);
|
||||
- /* the above two asserts also guarantee that the binary part never straddles more than 2 words, so we don't have to loop to read it */
|
||||
+ cwords = br->consumed_words;
|
||||
+ words = br->words;
|
||||
|
||||
- if(nvals == 0)
|
||||
- return true;
|
||||
+ /* if we've already consumed all the whole words, skip the fast path and go straight to the tail handling */
|
||||
+ if(cwords >= words) {
|
||||
+ x = 0;
|
||||
+ goto process_tail;
|
||||
+ }
|
||||
+
|
||||
+ ucbits = FLAC__BITS_PER_WORD - br->consumed_bits;
|
||||
+ b = br->buffer[cwords] << br->consumed_bits; /* keep unconsumed bits aligned to left */
|
||||
+
|
||||
+ while(val < end) {
|
||||
+ /* read the unary MSBs and end bit */
|
||||
+ x = y = COUNT_ZERO_MSBS(b);
|
||||
+ if(x == FLAC__BITS_PER_WORD) {
|
||||
+ x = ucbits;
|
||||
+ do {
|
||||
+ /* didn't find stop bit yet, have to keep going... */
|
||||
+ crc16_update_word_(br, br->buffer[cwords++]);
|
||||
+ if (cwords >= words)
|
||||
+ goto incomplete_msbs;
|
||||
+ b = br->buffer[cwords];
|
||||
+ y = COUNT_ZERO_MSBS(b);
|
||||
+ x += y;
|
||||
+ } while(y == FLAC__BITS_PER_WORD);
|
||||
+ }
|
||||
+ b <<= y;
|
||||
+ b <<= 1; /* account for stop bit */
|
||||
+ ucbits = (ucbits - x - 1) % FLAC__BITS_PER_WORD;
|
||||
+ msbs = x;
|
||||
+
|
||||
+ /* read the binary LSBs */
|
||||
+ x = b >> (FLAC__BITS_PER_WORD - parameter);
|
||||
+ if(parameter <= ucbits) {
|
||||
+ ucbits -= parameter;
|
||||
+ b <<= parameter;
|
||||
+ } else {
|
||||
+ /* there are still bits left to read, they will all be in the next word */
|
||||
+ crc16_update_word_(br, br->buffer[cwords++]);
|
||||
+ if (cwords >= words)
|
||||
+ goto incomplete_lsbs;
|
||||
+ b = br->buffer[cwords];
|
||||
+ ucbits += FLAC__BITS_PER_WORD - parameter;
|
||||
+ x |= b >> ucbits;
|
||||
+ b <<= FLAC__BITS_PER_WORD - ucbits;
|
||||
+ }
|
||||
+ lsbs = x;
|
||||
|
||||
- cbits = br->consumed_bits;
|
||||
- cwords = br->consumed_words;
|
||||
- ucbits = (br->words-cwords)*FLAC__BITS_PER_WORD + br->bytes*8 - cbits;
|
||||
+ /* compose the value */
|
||||
+ x = (msbs << parameter) | lsbs;
|
||||
+ *val++ = (int)(x >> 1) ^ -(int)(x & 1);
|
||||
|
||||
- while(1) {
|
||||
+ continue;
|
||||
|
||||
- /* read unary part */
|
||||
- while(1) {
|
||||
- while(cwords < br->words) { /* if we've not consumed up to a partial tail word... */
|
||||
- brword b = br->buffer[cwords] << cbits;
|
||||
- if(b) {
|
||||
-#if 0 /* is not discernably faster... */ && defined FLAC__CPU_IA32 && !defined FLAC__NO_ASM && FLAC__BITS_PER_WORD == 32 && defined __GNUC__
|
||||
- asm volatile (
|
||||
- "bsrl %1, %0;"
|
||||
- "notl %0;"
|
||||
- "andl $31, %0;"
|
||||
- : "=r"(i)
|
||||
- : "r"(b)
|
||||
- );
|
||||
-#else
|
||||
- i = COUNT_ZERO_MSBS(b);
|
||||
-#endif
|
||||
- uval += i;
|
||||
- cbits += i;
|
||||
- cbits++; /* skip over stop bit */
|
||||
- if(cbits >= FLAC__BITS_PER_WORD) { /* faster way of testing if(cbits == FLAC__BITS_PER_WORD) */
|
||||
- crc16_update_word_(br, br->buffer[cwords]);
|
||||
- cwords++;
|
||||
- cbits = 0;
|
||||
- }
|
||||
- goto break1;
|
||||
- }
|
||||
- else {
|
||||
- uval += FLAC__BITS_PER_WORD - cbits;
|
||||
- crc16_update_word_(br, br->buffer[cwords]);
|
||||
- cwords++;
|
||||
- cbits = 0;
|
||||
- /* didn't find stop bit yet, have to keep going... */
|
||||
- }
|
||||
- }
|
||||
- /* at this point we've eaten up all the whole words; have to try
|
||||
- * reading through any tail bytes before calling the read callback.
|
||||
- * this is a repeat of the above logic adjusted for the fact we
|
||||
- * don't have a whole word. note though if the client is feeding
|
||||
- * us data a byte at a time (unlikely), br->consumed_bits may not
|
||||
- * be zero.
|
||||
- */
|
||||
- if(br->bytes) {
|
||||
- const unsigned end = br->bytes * 8;
|
||||
- brword b = (br->buffer[cwords] & ~(FLAC__WORD_ALL_ONES >> end)) << cbits;
|
||||
- if(b) {
|
||||
- i = COUNT_ZERO_MSBS(b);
|
||||
- uval += i;
|
||||
- cbits += i;
|
||||
- cbits++; /* skip over stop bit */
|
||||
- FLAC__ASSERT(cbits < FLAC__BITS_PER_WORD);
|
||||
- goto break1;
|
||||
- }
|
||||
- else {
|
||||
- uval += end - cbits;
|
||||
- cbits += end;
|
||||
- FLAC__ASSERT(cbits < FLAC__BITS_PER_WORD);
|
||||
- /* didn't find stop bit yet, have to keep going... */
|
||||
- }
|
||||
+ /* at this point we've eaten up all the whole words */
|
||||
+process_tail:
|
||||
+ do {
|
||||
+ if(0) {
|
||||
+incomplete_msbs:
|
||||
+ br->consumed_bits = 0;
|
||||
+ br->consumed_words = cwords;
|
||||
}
|
||||
- /* flush registers and read; bitreader_read_from_client_() does
|
||||
- * not touch br->consumed_bits at all but we still need to set
|
||||
- * it in case it fails and we have to return false.
|
||||
- */
|
||||
- br->consumed_bits = cbits;
|
||||
- br->consumed_words = cwords;
|
||||
- if(!bitreader_read_from_client_(br))
|
||||
+
|
||||
+ /* read the unary MSBs and end bit */
|
||||
+ if(!FLAC__bitreader_read_unary_unsigned(br, &msbs))
|
||||
return false;
|
||||
- cwords = br->consumed_words;
|
||||
- ucbits = (br->words-cwords)*FLAC__BITS_PER_WORD + br->bytes*8 - cbits + uval;
|
||||
- /* + uval to offset our count by the # of unary bits already
|
||||
- * consumed before the read, because we will add these back
|
||||
- * in all at once at break1
|
||||
- */
|
||||
- }
|
||||
-break1:
|
||||
- ucbits -= uval;
|
||||
- ucbits--; /* account for stop bit */
|
||||
-
|
||||
- /* read binary part */
|
||||
- FLAC__ASSERT(cwords <= br->words);
|
||||
-
|
||||
- if(parameter) {
|
||||
- while(ucbits < parameter) {
|
||||
- /* flush registers and read; bitreader_read_from_client_() does
|
||||
- * not touch br->consumed_bits at all but we still need to set
|
||||
- * it in case it fails and we have to return false.
|
||||
- */
|
||||
- br->consumed_bits = cbits;
|
||||
+ msbs += x;
|
||||
+ x = ucbits = 0;
|
||||
+
|
||||
+ if(0) {
|
||||
+incomplete_lsbs:
|
||||
+ br->consumed_bits = 0;
|
||||
br->consumed_words = cwords;
|
||||
- if(!bitreader_read_from_client_(br))
|
||||
- return false;
|
||||
- cwords = br->consumed_words;
|
||||
- ucbits = (br->words-cwords)*FLAC__BITS_PER_WORD + br->bytes*8 - cbits;
|
||||
- }
|
||||
- if(cwords < br->words) { /* if we've not consumed up to a partial tail word... */
|
||||
- if(cbits) {
|
||||
- /* this also works when consumed_bits==0, it's just slower than necessary for that case */
|
||||
- const unsigned n = FLAC__BITS_PER_WORD - cbits;
|
||||
- const brword word = br->buffer[cwords];
|
||||
- if(parameter < n) {
|
||||
- uval <<= parameter;
|
||||
- uval |= (word & (FLAC__WORD_ALL_ONES >> cbits)) >> (n-parameter);
|
||||
- cbits += parameter;
|
||||
- }
|
||||
- else {
|
||||
- uval <<= n;
|
||||
- uval |= word & (FLAC__WORD_ALL_ONES >> cbits);
|
||||
- crc16_update_word_(br, word);
|
||||
- cwords++;
|
||||
- cbits = parameter - n;
|
||||
- if(cbits) { /* parameter > n, i.e. if there are still bits left to read, there have to be less than 32 so they will all be in the next word */
|
||||
- uval <<= cbits;
|
||||
- uval |= (br->buffer[cwords] >> (FLAC__BITS_PER_WORD-cbits));
|
||||
- }
|
||||
- }
|
||||
- }
|
||||
- else {
|
||||
- cbits = parameter;
|
||||
- uval <<= parameter;
|
||||
- uval |= br->buffer[cwords] >> (FLAC__BITS_PER_WORD-cbits);
|
||||
- }
|
||||
}
|
||||
- else {
|
||||
- /* in this case we're starting our read at a partial tail word;
|
||||
- * the reader has guaranteed that we have at least 'parameter'
|
||||
- * bits available to read, which makes this case simpler.
|
||||
- */
|
||||
- uval <<= parameter;
|
||||
- if(cbits) {
|
||||
- /* this also works when consumed_bits==0, it's just a little slower than necessary for that case */
|
||||
- FLAC__ASSERT(cbits + parameter <= br->bytes*8);
|
||||
- uval |= (br->buffer[cwords] & (FLAC__WORD_ALL_ONES >> cbits)) >> (FLAC__BITS_PER_WORD-cbits-parameter);
|
||||
- cbits += parameter;
|
||||
- }
|
||||
- else {
|
||||
- cbits = parameter;
|
||||
- uval |= br->buffer[cwords] >> (FLAC__BITS_PER_WORD-cbits);
|
||||
- }
|
||||
- }
|
||||
- }
|
||||
|
||||
- ucbits -= parameter;
|
||||
-
|
||||
- /* compose the value */
|
||||
- *vals = (int)(uval >> 1 ^ -(int)(uval & 1));
|
||||
+ /* read the binary LSBs */
|
||||
+ if(!FLAC__bitreader_read_raw_uint32(br, &lsbs, parameter - ucbits))
|
||||
+ return false;
|
||||
+ lsbs = x | lsbs;
|
||||
|
||||
- /* are we done? */
|
||||
- --nvals;
|
||||
- if(nvals == 0) {
|
||||
- br->consumed_bits = cbits;
|
||||
- br->consumed_words = cwords;
|
||||
- return true;
|
||||
- }
|
||||
+ /* compose the value */
|
||||
+ x = (msbs << parameter) | lsbs;
|
||||
+ *val++ = (int)(x >> 1) ^ -(int)(x & 1);
|
||||
+ x = 0;
|
||||
|
||||
- uval = 0;
|
||||
- ++vals;
|
||||
+ cwords = br->consumed_words;
|
||||
+ words = br->words;
|
||||
+ ucbits = FLAC__BITS_PER_WORD - br->consumed_bits;
|
||||
+ b = br->buffer[cwords] << br->consumed_bits;
|
||||
+ } while(cwords >= words && val < end);
|
||||
+ }
|
||||
|
||||
+ if(ucbits == 0 && cwords < words) {
|
||||
+ /* don't leave the head word with no unconsumed bits */
|
||||
+ crc16_update_word_(br, br->buffer[cwords++]);
|
||||
+ ucbits = FLAC__BITS_PER_WORD;
|
||||
}
|
||||
+
|
||||
+ br->consumed_bits = FLAC__BITS_PER_WORD - ucbits;
|
||||
+ br->consumed_words = cwords;
|
||||
+
|
||||
+ return true;
|
||||
}
|
||||
-#endif
|
||||
|
||||
#if 0 /* UNUSED */
|
||||
FLAC__bool FLAC__bitreader_read_golomb_signed(FLAC__BitReader *br, int *val, unsigned parameter)
|
45
flac-1.2.1-cflags.patch
Normal file
45
flac-1.2.1-cflags.patch
Normal file
@ -0,0 +1,45 @@
|
||||
diff -up flac-1.2.1/src/libFLAC/Makefile.am.cflags flac-1.2.1/src/libFLAC/Makefile.am
|
||||
--- flac-1.2.1/src/libFLAC/Makefile.am.cflags 2007-09-14 23:06:17.000000000 +0200
|
||||
+++ flac-1.2.1/src/libFLAC/Makefile.am 2008-03-17 14:19:29.000000000 +0100
|
||||
@@ -41,7 +41,7 @@ CPUCFLAGS = -faltivec -force_cpusubtype_
|
||||
else
|
||||
# Linux-gcc for PPC does not have -force_cpusubtype_ALL, it is Darwin-specific
|
||||
#@@@ PPC optimizations temporarily disabled
|
||||
-CPUCFLAGS = -maltivec -mabi=altivec -DFLAC__NO_ASM
|
||||
+CPUCFLAGS = -DFLAC__NO_ASM
|
||||
endif
|
||||
endif
|
||||
|
||||
@@ -69,7 +69,7 @@ endif
|
||||
endif
|
||||
endif
|
||||
|
||||
-libFLAC_la_LIBADD = $(LOCAL_EXTRA_LIBADD) @OGG_LIBS@
|
||||
+libFLAC_la_LIBADD = $(LOCAL_EXTRA_LIBADD) @OGG_LIBS@ libFLAC_extracflags.la
|
||||
|
||||
SUBDIRS = $(ARCH_SUBDIRS) include .
|
||||
|
||||
@@ -112,7 +112,10 @@ libFLAC_la_SOURCES = \
|
||||
metadata_iterators.c \
|
||||
metadata_object.c \
|
||||
stream_decoder.c \
|
||||
- stream_encoder.c \
|
||||
stream_encoder_framing.c \
|
||||
window.c \
|
||||
$(extra_ogg_sources)
|
||||
+
|
||||
+noinst_LTLIBRARIES = libFLAC_extracflags.la
|
||||
+libFLAC_extracflags_la_SOURCES = stream_encoder.c
|
||||
+libFLAC_extracflags_la_CFLAGS = $(AM_CFLAGS) -funroll-loops
|
||||
diff -up flac-1.2.1/configure.in.cflags flac-1.2.1/configure.in
|
||||
--- flac-1.2.1/configure.in.cflags 2007-09-13 17:48:42.000000000 +0200
|
||||
+++ flac-1.2.1/configure.in 2008-03-17 14:17:08.000000000 +0100
|
||||
@@ -301,7 +301,7 @@ else
|
||||
CPPFLAGS="-DNDEBUG $CPPFLAGS"
|
||||
if test "x$GCC" = xyes; then
|
||||
CPPFLAGS="-DFLaC__INLINE=__inline__ $CPPFLAGS"
|
||||
- CFLAGS="-O3 -funroll-loops -finline-functions -Wall -W -Winline $CFLAGS"
|
||||
+ CFLAGS="-Wall -W -Winline $CFLAGS"
|
||||
fi
|
||||
fi
|
||||
|
@ -1,12 +0,0 @@
|
||||
diff -up flac-1.2.1/src/libFLAC/Makefile.in.ppc flac-1.2.1/src/libFLAC/Makefile.in
|
||||
--- flac-1.2.1/src/libFLAC/Makefile.in.ppc 2007-09-16 22:05:12.000000000 +0200
|
||||
+++ flac-1.2.1/src/libFLAC/Makefile.in 2008-01-30 14:19:51.000000000 +0100
|
||||
@@ -240,7 +240,7 @@ lib_LTLIBRARIES = libFLAC.la
|
||||
@FLaC__CPU_PPC_TRUE@@FLaC__SYS_DARWIN_TRUE@CPUCFLAGS = -faltivec -force_cpusubtype_ALL -DFLAC__NO_ASM
|
||||
# Linux-gcc for PPC does not have -force_cpusubtype_ALL, it is Darwin-specific
|
||||
#@@@ PPC optimizations temporarily disabled
|
||||
-@FLaC__CPU_PPC_TRUE@@FLaC__SYS_DARWIN_FALSE@CPUCFLAGS = -maltivec -mabi=altivec -DFLAC__NO_ASM
|
||||
+@FLaC__CPU_PPC_TRUE@@FLaC__SYS_DARWIN_FALSE@CPUCFLAGS = -DFLAC__NO_ASM
|
||||
|
||||
AM_CFLAGS = $(DEBUGCFLAGS) $(CPUCFLAGS) @OGG_CFLAGS@
|
||||
@FLaC__CPU_PPC_TRUE@@FLaC__NO_ASM_FALSE@ARCH_SUBDIRS = ppc
|
@ -10,19 +10,20 @@ diff -up flac-1.2.1/test/test_seeking.sh.tests flac-1.2.1/test/test_seeking.sh
|
||||
fi
|
||||
|
||||
for suffix in '' '-s' ; do
|
||||
diff -up flac-1.2.1/test/Makefile.in.tests flac-1.2.1/test/Makefile.in
|
||||
--- flac-1.2.1/test/Makefile.in.tests 2007-09-16 22:05:27.000000000 +0200
|
||||
+++ flac-1.2.1/test/Makefile.in 2008-01-29 13:51:33.000000000 +0100
|
||||
@@ -231,8 +231,7 @@ TESTS = \
|
||||
./test_grabbag.sh \
|
||||
./test_flac.sh \
|
||||
./test_metaflac.sh \
|
||||
- ./test_seeking.sh \
|
||||
- ./test_streams.sh
|
||||
+ ./test_seeking.sh
|
||||
diff -up flac-1.2.1/test/test_streams.sh.tests flac-1.2.1/test/test_streams.sh
|
||||
--- flac-1.2.1/test/test_streams.sh.tests 2007-06-16 21:58:39.000000000 +0200
|
||||
+++ flac-1.2.1/test/test_streams.sh 2008-03-17 13:57:39.000000000 +0100
|
||||
@@ -39,6 +39,10 @@ if [ x"$FLAC__TEST_LEVEL" = x ] ; then
|
||||
FLAC__TEST_LEVEL=1
|
||||
fi
|
||||
|
||||
+if [ "$FLAC__TEST_LEVEL" -eq 0 ] ; then
|
||||
+ exit 0
|
||||
+fi
|
||||
+
|
||||
flac --help 1>/dev/null 2>/dev/null || die "ERROR can't find flac executable"
|
||||
|
||||
EXTRA_DIST = \
|
||||
run_flac ()
|
||||
diff -up flac-1.2.1/src/test_streams/main.c.tests flac-1.2.1/src/test_streams/main.c
|
||||
--- flac-1.2.1/src/test_streams/main.c.tests 2007-08-31 07:54:49.000000000 +0200
|
||||
+++ flac-1.2.1/src/test_streams/main.c 2008-01-29 13:53:46.000000000 +0100
|
||||
|
19
flac.spec
19
flac.spec
@ -1,7 +1,7 @@
|
||||
Summary: An encoder/decoder for the Free Lossless Audio Codec
|
||||
Name: flac
|
||||
Version: 1.2.1
|
||||
Release: 3%{?dist}
|
||||
Release: 4%{?dist}
|
||||
License: BSD and GPLv2+
|
||||
Group: Applications/Multimedia
|
||||
Source: http://prdownloads.sourceforge.net/flac/flac-%{version}.tar.gz
|
||||
@ -9,10 +9,12 @@ Patch1: flac-1.2.1-asm.patch
|
||||
Patch2: flac-1.2.1-gcc43.patch
|
||||
Patch3: flac-1.2.1-hidesyms.patch
|
||||
Patch4: flac-1.2.1-tests.patch
|
||||
Patch5: flac-1.2.1-ppc.patch
|
||||
Patch5: flac-1.2.1-cflags.patch
|
||||
Patch6: flac-1.2.1-bitreader.patch
|
||||
URL: http://flac.sourceforge.net/
|
||||
BuildRoot: %{_tmppath}/%{name}-%{version}-%{release}-root-%(%{__id_u} -n)
|
||||
BuildRequires: libogg-devel
|
||||
BuildRequires: automake autoconf libtool gettext-devel
|
||||
%ifarch %{ix86}
|
||||
# 2.0 supports symbol visibility
|
||||
BuildRequires: nasm >= 2.0
|
||||
@ -43,10 +45,15 @@ will use the Free Lossless Audio Codec.
|
||||
%patch3 -p1 -b .hidesyms
|
||||
# reduce number of tests
|
||||
%patch4 -p1 -b .tests
|
||||
%patch5 -p1 -b .ppc
|
||||
%patch5 -p1 -b .cflags
|
||||
%patch6 -p0 -b .bitreader
|
||||
|
||||
%build
|
||||
%configure --disable-xmms-plugin
|
||||
./autogen.sh -V
|
||||
|
||||
%configure \
|
||||
--disable-xmms-plugin \
|
||||
--disable-thorough-tests
|
||||
|
||||
make %{?_smp_mflags}
|
||||
|
||||
@ -84,6 +91,10 @@ rm -rf %{buildroot}
|
||||
%{_datadir}/aclocal/*.m4
|
||||
|
||||
%changelog
|
||||
* Mon Mar 17 2008 Miroslav Lichvar <mlichvar@redhat.com> 1.2.1-4
|
||||
- speed up decoding
|
||||
- CFLAGS cleanup
|
||||
|
||||
* Tue Feb 19 2008 Fedora Release Engineering <rel-eng@fedoraproject.org> - 1.2.1-3
|
||||
- Autorebuild for GCC 4.3
|
||||
|
||||
|
Loading…
Reference in New Issue
Block a user