Index: src/libFLAC/stream_encoder.c |
diff --git a/src/libFLAC/stream_encoder.c b/src/libFLAC/stream_encoder.c |
index fc0d22d971f87acb109e0cb2de47682975524a1d..45bdb252b6861842842d5183c8e49578f5131386 100644 |
--- a/src/libFLAC/stream_encoder.c |
+++ b/src/libFLAC/stream_encoder.c |
@@ -1,5 +1,6 @@ |
/* libFLAC - Free Lossless Audio Codec library |
- * Copyright (C) 2000,2001,2002,2003,2004,2005,2006,2007 Josh Coalson |
+ * Copyright (C) 2000-2009 Josh Coalson |
+ * Copyright (C) 2011-2014 Xiph.Org Foundation |
* |
* Redistribution and use in source and binary forms, with or without |
* modification, are permitted provided that the following conditions |
@@ -29,35 +30,18 @@ |
* SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. |
*/ |
-#if HAVE_CONFIG_H |
+#ifdef HAVE_CONFIG_H |
# include <config.h> |
#endif |
-#if defined _MSC_VER || defined __MINGW32__ |
-#include <io.h> /* for _setmode() */ |
-#include <fcntl.h> /* for _O_BINARY */ |
-#endif |
-#if defined __CYGWIN__ || defined __EMX__ |
-#include <io.h> /* for setmode(), O_BINARY */ |
-#include <fcntl.h> /* for _O_BINARY */ |
-#endif |
#include <limits.h> |
#include <stdio.h> |
#include <stdlib.h> /* for malloc() */ |
#include <string.h> /* for memcpy() */ |
#include <sys/types.h> /* for off_t */ |
-#if defined _MSC_VER || defined __BORLANDC__ || defined __MINGW32__ |
-#if _MSC_VER <= 1600 || defined __BORLANDC__ /* @@@ [2G limit] */ |
-#define fseeko fseek |
-#define ftello ftell |
-#else |
-#define fseeko _fseeki64 |
-#define ftello _ftelli64 |
-#endif |
-#endif |
+#include "share/compat.h" |
#include "FLAC/assert.h" |
#include "FLAC/stream_decoder.h" |
-#include "share/alloc.h" |
#include "protected/stream_encoder.h" |
#include "private/bitwriter.h" |
#include "private/bitmath.h" |
@@ -68,26 +52,17 @@ |
#include "private/lpc.h" |
#include "private/md5.h" |
#include "private/memory.h" |
+#include "private/macros.h" |
#if FLAC__HAS_OGG |
#include "private/ogg_helper.h" |
#include "private/ogg_mapping.h" |
#endif |
+#include "private/stream_encoder.h" |
#include "private/stream_encoder_framing.h" |
#include "private/window.h" |
+#include "share/alloc.h" |
+#include "share/private.h" |
-#ifndef FLaC__INLINE |
-#define FLaC__INLINE |
-#endif |
- |
-#ifdef min |
-#undef min |
-#endif |
-#define min(x,y) ((x)<(y)?(x):(y)) |
- |
-#ifdef max |
-#undef max |
-#endif |
-#define max(x,y) ((x)>(y)?(x):(y)) |
/* Exact Rice codeword length calculation is off by default. The simple |
* (and fast) estimation (of how many bits a residual value will be |
@@ -99,7 +74,7 @@ |
* parameter estimation in this encoder is very good, almost always |
* yielding compression within 0.1% of the optimal parameters. |
*/ |
-#undef ENABLE_RICE_PARAMETER_SEARCH |
+#undef ENABLE_RICE_PARAMETER_SEARCH |
typedef struct { |
@@ -111,7 +86,7 @@ typedef struct { |
typedef struct { |
const FLAC__byte *data; |
unsigned capacity; |
- size_t bytes; |
+ unsigned bytes; |
} verify_output; |
typedef enum { |
@@ -131,16 +106,18 @@ static struct CompressionLevels { |
unsigned min_residual_partition_order; |
unsigned max_residual_partition_order; |
unsigned rice_parameter_search_dist; |
+ const char *apodization; |
} compression_levels_[] = { |
- { false, false, 0, 0, false, false, false, 0, 3, 0 }, |
- { true , true , 0, 0, false, false, false, 0, 3, 0 }, |
- { true , false, 0, 0, false, false, false, 0, 3, 0 }, |
- { false, false, 6, 0, false, false, false, 0, 4, 0 }, |
- { true , true , 8, 0, false, false, false, 0, 4, 0 }, |
- { true , false, 8, 0, false, false, false, 0, 5, 0 }, |
- { true , false, 8, 0, false, false, false, 0, 6, 0 }, |
- { true , false, 8, 0, false, false, true , 0, 6, 0 }, |
- { true , false, 12, 0, false, false, true , 0, 6, 0 } |
+ { false, false, 0, 0, false, false, false, 0, 3, 0, "tukey(5e-1)" }, |
+ { true , true , 0, 0, false, false, false, 0, 3, 0, "tukey(5e-1)" }, |
+ { true , false, 0, 0, false, false, false, 0, 3, 0, "tukey(5e-1)" }, |
+ { false, false, 6, 0, false, false, false, 0, 4, 0, "tukey(5e-1)" }, |
+ { true , true , 8, 0, false, false, false, 0, 4, 0, "tukey(5e-1)" }, |
+ { true , false, 8, 0, false, false, false, 0, 5, 0, "tukey(5e-1)" }, |
+ { true , false, 8, 0, false, false, false, 0, 6, 0, "tukey(5e-1);partial_tukey(2)" }, |
+ { true , false, 12, 0, false, false, false, 0, 6, 0, "tukey(5e-1);partial_tukey(2)" }, |
+ { true , false, 12, 0, false, false, false, 0, 6, 0, "tukey(5e-1);partial_tukey(2);punchout_tukey(3)" } |
+ /* here we use locale-independent 5e-1 instead of 0.5 or 0,5 */ |
}; |
@@ -235,7 +212,7 @@ static unsigned evaluate_lpc_subframe_( |
#endif |
static unsigned evaluate_verbatim_subframe_( |
- FLAC__StreamEncoder *encoder, |
+ FLAC__StreamEncoder *encoder, |
const FLAC__int32 signal[], |
unsigned blocksize, |
unsigned subframe_bps, |
@@ -370,10 +347,13 @@ typedef struct FLAC__StreamEncoderPrivate { |
unsigned current_frame_number; |
FLAC__MD5Context md5context; |
FLAC__CPUInfo cpuinfo; |
+ void (*local_precompute_partition_info_sums)(const FLAC__int32 residual[], FLAC__uint64 abs_residual_partition_sums[], unsigned residual_samples, unsigned predictor_order, unsigned min_partition_order, unsigned max_partition_order, unsigned bps); |
#ifndef FLAC__INTEGER_ONLY_LIBRARY |
unsigned (*local_fixed_compute_best_predictor)(const FLAC__int32 data[], unsigned data_len, FLAC__float residual_bits_per_sample[FLAC__MAX_FIXED_ORDER+1]); |
+ unsigned (*local_fixed_compute_best_predictor_wide)(const FLAC__int32 data[], unsigned data_len, FLAC__float residual_bits_per_sample[FLAC__MAX_FIXED_ORDER+1]); |
#else |
unsigned (*local_fixed_compute_best_predictor)(const FLAC__int32 data[], unsigned data_len, FLAC__fixedpoint residual_bits_per_sample[FLAC__MAX_FIXED_ORDER+1]); |
+ unsigned (*local_fixed_compute_best_predictor_wide)(const FLAC__int32 data[], unsigned data_len, FLAC__fixedpoint residual_bits_per_sample[FLAC__MAX_FIXED_ORDER+1]); |
#endif |
#ifndef FLAC__INTEGER_ONLY_LIBRARY |
void (*local_lpc_compute_autocorrelation)(const FLAC__real data[], unsigned data_len, unsigned lag, FLAC__real autoc[]); |
@@ -480,7 +460,7 @@ FLAC_API const char * const FLAC__StreamEncoderInitStatusString[] = { |
"FLAC__STREAM_ENCODER_INIT_STATUS_ALREADY_INITIALIZED" |
}; |
-FLAC_API const char * const FLAC__treamEncoderReadStatusString[] = { |
+FLAC_API const char * const FLAC__StreamEncoderReadStatusString[] = { |
"FLAC__STREAM_ENCODER_READ_STATUS_CONTINUE", |
"FLAC__STREAM_ENCODER_READ_STATUS_END_OF_STREAM", |
"FLAC__STREAM_ENCODER_READ_STATUS_ABORT", |
@@ -529,18 +509,18 @@ FLAC_API FLAC__StreamEncoder *FLAC__stream_encoder_new(void) |
FLAC__ASSERT(sizeof(int) >= 4); /* we want to die right away if this is not true */ |
- encoder = (FLAC__StreamEncoder*)calloc(1, sizeof(FLAC__StreamEncoder)); |
+ encoder = calloc(1, sizeof(FLAC__StreamEncoder)); |
if(encoder == 0) { |
return 0; |
} |
- encoder->protected_ = (FLAC__StreamEncoderProtected*)calloc(1, sizeof(FLAC__StreamEncoderProtected)); |
+ encoder->protected_ = calloc(1, sizeof(FLAC__StreamEncoderProtected)); |
if(encoder->protected_ == 0) { |
free(encoder); |
return 0; |
} |
- encoder->private_ = (FLAC__StreamEncoderPrivate*)calloc(1, sizeof(FLAC__StreamEncoderPrivate)); |
+ encoder->private_ = calloc(1, sizeof(FLAC__StreamEncoderPrivate)); |
if(encoder->private_ == 0) { |
free(encoder->protected_); |
free(encoder); |
@@ -598,7 +578,9 @@ FLAC_API void FLAC__stream_encoder_delete(FLAC__StreamEncoder *encoder) |
{ |
unsigned i; |
- FLAC__ASSERT(0 != encoder); |
+ if (encoder == NULL) |
+ return ; |
+ |
FLAC__ASSERT(0 != encoder->protected_); |
FLAC__ASSERT(0 != encoder->private_); |
FLAC__ASSERT(0 != encoder->private_->frame); |
@@ -699,7 +681,7 @@ static FLAC__StreamEncoderInitStatus init_stream_internal_( |
if(encoder->protected_->bits_per_sample < 16) { |
/* @@@ need some data about how to set this here w.r.t. blocksize and sample rate */ |
/* @@@ until then we'll make a guess */ |
- encoder->protected_->qlp_coeff_precision = max(FLAC__MIN_QLP_COEFF_PRECISION, 2 + encoder->protected_->bits_per_sample / 2); |
+ encoder->protected_->qlp_coeff_precision = flac_max(FLAC__MIN_QLP_COEFF_PRECISION, 2 + encoder->protected_->bits_per_sample / 2); |
} |
else if(encoder->protected_->bits_per_sample == 16) { |
if(encoder->protected_->blocksize <= 192) |
@@ -731,20 +713,7 @@ static FLAC__StreamEncoderInitStatus init_stream_internal_( |
return FLAC__STREAM_ENCODER_INIT_STATUS_INVALID_QLP_COEFF_PRECISION; |
if(encoder->protected_->streamable_subset) { |
- if( |
- encoder->protected_->blocksize != 192 && |
- encoder->protected_->blocksize != 576 && |
- encoder->protected_->blocksize != 1152 && |
- encoder->protected_->blocksize != 2304 && |
- encoder->protected_->blocksize != 4608 && |
- encoder->protected_->blocksize != 256 && |
- encoder->protected_->blocksize != 512 && |
- encoder->protected_->blocksize != 1024 && |
- encoder->protected_->blocksize != 2048 && |
- encoder->protected_->blocksize != 4096 && |
- encoder->protected_->blocksize != 8192 && |
- encoder->protected_->blocksize != 16384 |
- ) |
+ if(!FLAC__format_blocksize_is_subset(encoder->protected_->blocksize, encoder->protected_->sample_rate)) |
return FLAC__STREAM_ENCODER_INIT_STATUS_NOT_STREAMABLE; |
if(!FLAC__format_sample_rate_is_subset(encoder->protected_->sample_rate)) |
return FLAC__STREAM_ENCODER_INIT_STATUS_NOT_STREAMABLE; |
@@ -777,12 +746,12 @@ static FLAC__StreamEncoderInitStatus init_stream_internal_( |
#if FLAC__HAS_OGG |
/* reorder metadata if necessary to ensure that any VORBIS_COMMENT is the first, according to the mapping spec */ |
if(is_ogg && 0 != encoder->protected_->metadata && encoder->protected_->num_metadata_blocks > 1) { |
- unsigned i; |
- for(i = 1; i < encoder->protected_->num_metadata_blocks; i++) { |
- if(0 != encoder->protected_->metadata[i] && encoder->protected_->metadata[i]->type == FLAC__METADATA_TYPE_VORBIS_COMMENT) { |
- FLAC__StreamMetadata *vc = encoder->protected_->metadata[i]; |
- for( ; i > 0; i--) |
- encoder->protected_->metadata[i] = encoder->protected_->metadata[i-1]; |
+ unsigned i1; |
+ for(i1 = 1; i1 < encoder->protected_->num_metadata_blocks; i1++) { |
+ if(0 != encoder->protected_->metadata[i1] && encoder->protected_->metadata[i1]->type == FLAC__METADATA_TYPE_VORBIS_COMMENT) { |
+ FLAC__StreamMetadata *vc = encoder->protected_->metadata[i1]; |
+ for( ; i1 > 0; i1--) |
+ encoder->protected_->metadata[i1] = encoder->protected_->metadata[i1-1]; |
encoder->protected_->metadata[0] = vc; |
break; |
} |
@@ -791,10 +760,10 @@ static FLAC__StreamEncoderInitStatus init_stream_internal_( |
#endif |
/* keep track of any SEEKTABLE block */ |
if(0 != encoder->protected_->metadata && encoder->protected_->num_metadata_blocks > 0) { |
- unsigned i; |
- for(i = 0; i < encoder->protected_->num_metadata_blocks; i++) { |
- if(0 != encoder->protected_->metadata[i] && encoder->protected_->metadata[i]->type == FLAC__METADATA_TYPE_SEEKTABLE) { |
- encoder->private_->seek_table = &encoder->protected_->metadata[i]->data.seek_table; |
+ unsigned i2; |
+ for(i2 = 0; i2 < encoder->protected_->num_metadata_blocks; i2++) { |
+ if(0 != encoder->protected_->metadata[i2] && encoder->protected_->metadata[i2]->type == FLAC__METADATA_TYPE_SEEKTABLE) { |
+ encoder->private_->seek_table = &encoder->protected_->metadata[i2]->data.seek_table; |
break; /* take only the first one */ |
} |
} |
@@ -836,7 +805,7 @@ static FLAC__StreamEncoderInitStatus init_stream_internal_( |
metadata_picture_has_type1 = true; |
/* standard icon must be 32x32 pixel PNG */ |
if( |
- m->data.picture.type == FLAC__STREAM_METADATA_PICTURE_TYPE_FILE_ICON_STANDARD && |
+ m->data.picture.type == FLAC__STREAM_METADATA_PICTURE_TYPE_FILE_ICON_STANDARD && |
( |
(strcmp(m->data.picture.mime_type, "image/png") && strcmp(m->data.picture.mime_type, "-->")) || |
m->data.picture.width != 32 || |
@@ -901,7 +870,7 @@ static FLAC__StreamEncoderInitStatus init_stream_internal_( |
encoder->private_->current_frame_number = 0; |
encoder->private_->use_wide_by_block = (encoder->protected_->bits_per_sample + FLAC__bitmath_ilog2(encoder->protected_->blocksize)+1 > 30); |
- encoder->private_->use_wide_by_order = (encoder->protected_->bits_per_sample + FLAC__bitmath_ilog2(max(encoder->protected_->max_lpc_order, FLAC__MAX_FIXED_ORDER))+1 > 30); /*@@@ need to use this? */ |
+ encoder->private_->use_wide_by_order = (encoder->protected_->bits_per_sample + FLAC__bitmath_ilog2(flac_max(encoder->protected_->max_lpc_order, FLAC__MAX_FIXED_ORDER))+1 > 30); /*@@@ need to use this? */ |
encoder->private_->use_wide_by_partition = (false); /*@@@ need to set this */ |
/* |
@@ -912,7 +881,9 @@ static FLAC__StreamEncoderInitStatus init_stream_internal_( |
#ifndef FLAC__INTEGER_ONLY_LIBRARY |
encoder->private_->local_lpc_compute_autocorrelation = FLAC__lpc_compute_autocorrelation; |
#endif |
+ encoder->private_->local_precompute_partition_info_sums = precompute_partition_info_sums_; |
encoder->private_->local_fixed_compute_best_predictor = FLAC__fixed_compute_best_predictor; |
+ encoder->private_->local_fixed_compute_best_predictor_wide = FLAC__fixed_compute_best_predictor_wide; |
#ifndef FLAC__INTEGER_ONLY_LIBRARY |
encoder->private_->local_lpc_compute_residual_from_qlp_coefficients = FLAC__lpc_compute_residual_from_qlp_coefficients; |
encoder->private_->local_lpc_compute_residual_from_qlp_coefficients_64bit = FLAC__lpc_compute_residual_from_qlp_coefficients_wide; |
@@ -925,21 +896,23 @@ static FLAC__StreamEncoderInitStatus init_stream_internal_( |
# ifdef FLAC__CPU_IA32 |
FLAC__ASSERT(encoder->private_->cpuinfo.type == FLAC__CPUINFO_TYPE_IA32); |
# ifdef FLAC__HAS_NASM |
- if(encoder->private_->cpuinfo.data.ia32.sse) { |
+ if(encoder->private_->cpuinfo.ia32.sse) { |
if(encoder->protected_->max_lpc_order < 4) |
encoder->private_->local_lpc_compute_autocorrelation = FLAC__lpc_compute_autocorrelation_asm_ia32_sse_lag_4; |
else if(encoder->protected_->max_lpc_order < 8) |
encoder->private_->local_lpc_compute_autocorrelation = FLAC__lpc_compute_autocorrelation_asm_ia32_sse_lag_8; |
else if(encoder->protected_->max_lpc_order < 12) |
encoder->private_->local_lpc_compute_autocorrelation = FLAC__lpc_compute_autocorrelation_asm_ia32_sse_lag_12; |
+ else if(encoder->protected_->max_lpc_order < 16) |
+ encoder->private_->local_lpc_compute_autocorrelation = FLAC__lpc_compute_autocorrelation_asm_ia32_sse_lag_16; |
else |
encoder->private_->local_lpc_compute_autocorrelation = FLAC__lpc_compute_autocorrelation_asm_ia32; |
} |
- else if(encoder->private_->cpuinfo.data.ia32._3dnow) |
- encoder->private_->local_lpc_compute_autocorrelation = FLAC__lpc_compute_autocorrelation_asm_ia32_3dnow; |
else |
encoder->private_->local_lpc_compute_autocorrelation = FLAC__lpc_compute_autocorrelation_asm_ia32; |
- if(encoder->private_->cpuinfo.data.ia32.mmx) { |
+ |
+ encoder->private_->local_lpc_compute_residual_from_qlp_coefficients_64bit = FLAC__lpc_compute_residual_from_qlp_coefficients_wide_asm_ia32; /* OPT_IA32: was really necessary for GCC < 4.9 */ |
+ if(encoder->private_->cpuinfo.ia32.mmx) { |
encoder->private_->local_lpc_compute_residual_from_qlp_coefficients = FLAC__lpc_compute_residual_from_qlp_coefficients_asm_ia32; |
encoder->private_->local_lpc_compute_residual_from_qlp_coefficients_16bit = FLAC__lpc_compute_residual_from_qlp_coefficients_asm_ia32_mmx; |
} |
@@ -947,16 +920,137 @@ static FLAC__StreamEncoderInitStatus init_stream_internal_( |
encoder->private_->local_lpc_compute_residual_from_qlp_coefficients = FLAC__lpc_compute_residual_from_qlp_coefficients_asm_ia32; |
encoder->private_->local_lpc_compute_residual_from_qlp_coefficients_16bit = FLAC__lpc_compute_residual_from_qlp_coefficients_asm_ia32; |
} |
- if(encoder->private_->cpuinfo.data.ia32.mmx && encoder->private_->cpuinfo.data.ia32.cmov) |
+ |
+ if(encoder->private_->cpuinfo.ia32.mmx && encoder->private_->cpuinfo.ia32.cmov) |
encoder->private_->local_fixed_compute_best_predictor = FLAC__fixed_compute_best_predictor_asm_ia32_mmx_cmov; |
# endif /* FLAC__HAS_NASM */ |
-# endif /* FLAC__CPU_IA32 */ |
+# ifdef FLAC__HAS_X86INTRIN |
+# if defined FLAC__SSE_SUPPORTED |
+ if(encoder->private_->cpuinfo.ia32.sse) { |
+ if(encoder->protected_->max_lpc_order < 4) |
+ encoder->private_->local_lpc_compute_autocorrelation = FLAC__lpc_compute_autocorrelation_intrin_sse_lag_4; |
+ else if(encoder->protected_->max_lpc_order < 8) |
+ encoder->private_->local_lpc_compute_autocorrelation = FLAC__lpc_compute_autocorrelation_intrin_sse_lag_8; |
+ else if(encoder->protected_->max_lpc_order < 12) |
+ encoder->private_->local_lpc_compute_autocorrelation = FLAC__lpc_compute_autocorrelation_intrin_sse_lag_12; |
+ else if(encoder->protected_->max_lpc_order < 16) |
+ encoder->private_->local_lpc_compute_autocorrelation = FLAC__lpc_compute_autocorrelation_intrin_sse_lag_16; |
+ else |
+ encoder->private_->local_lpc_compute_autocorrelation = FLAC__lpc_compute_autocorrelation; |
+ } |
+# endif |
+ |
+# ifdef FLAC__SSE2_SUPPORTED |
+ if(encoder->private_->cpuinfo.ia32.sse2) { |
+ encoder->private_->local_lpc_compute_residual_from_qlp_coefficients = FLAC__lpc_compute_residual_from_qlp_coefficients_intrin_sse2; |
+ encoder->private_->local_lpc_compute_residual_from_qlp_coefficients_16bit = FLAC__lpc_compute_residual_from_qlp_coefficients_16_intrin_sse2; |
+ } |
+# endif |
+# ifdef FLAC__SSE4_1_SUPPORTED |
+ if(encoder->private_->cpuinfo.ia32.sse41) { |
+ encoder->private_->local_lpc_compute_residual_from_qlp_coefficients = FLAC__lpc_compute_residual_from_qlp_coefficients_intrin_sse41; |
+ encoder->private_->local_lpc_compute_residual_from_qlp_coefficients_64bit = FLAC__lpc_compute_residual_from_qlp_coefficients_wide_intrin_sse41; |
+ } |
+# endif |
+# ifdef FLAC__AVX2_SUPPORTED |
+ if(encoder->private_->cpuinfo.ia32.avx2) { |
+ encoder->private_->local_lpc_compute_residual_from_qlp_coefficients_16bit = FLAC__lpc_compute_residual_from_qlp_coefficients_16_intrin_avx2; |
+ encoder->private_->local_lpc_compute_residual_from_qlp_coefficients = FLAC__lpc_compute_residual_from_qlp_coefficients_intrin_avx2; |
+ encoder->private_->local_lpc_compute_residual_from_qlp_coefficients_64bit = FLAC__lpc_compute_residual_from_qlp_coefficients_wide_intrin_avx2; |
+ } |
+# endif |
+ |
+# ifdef FLAC__SSE2_SUPPORTED |
+ if (encoder->private_->cpuinfo.ia32.sse2) { |
+ encoder->private_->local_fixed_compute_best_predictor = FLAC__fixed_compute_best_predictor_intrin_sse2; |
+ encoder->private_->local_fixed_compute_best_predictor_wide = FLAC__fixed_compute_best_predictor_wide_intrin_sse2; |
+ } |
+# endif |
+# ifdef FLAC__SSSE3_SUPPORTED |
+ if (encoder->private_->cpuinfo.ia32.ssse3) { |
+ encoder->private_->local_fixed_compute_best_predictor = FLAC__fixed_compute_best_predictor_intrin_ssse3; |
+ encoder->private_->local_fixed_compute_best_predictor_wide = FLAC__fixed_compute_best_predictor_wide_intrin_ssse3; |
+ } |
+# endif |
+# endif /* FLAC__HAS_X86INTRIN */ |
+# elif defined FLAC__CPU_X86_64 |
+ FLAC__ASSERT(encoder->private_->cpuinfo.type == FLAC__CPUINFO_TYPE_X86_64); |
+# ifdef FLAC__HAS_X86INTRIN |
+# ifdef FLAC__SSE_SUPPORTED |
+ if(encoder->protected_->max_lpc_order < 4) |
+ encoder->private_->local_lpc_compute_autocorrelation = FLAC__lpc_compute_autocorrelation_intrin_sse_lag_4; |
+ else if(encoder->protected_->max_lpc_order < 8) |
+ encoder->private_->local_lpc_compute_autocorrelation = FLAC__lpc_compute_autocorrelation_intrin_sse_lag_8; |
+ else if(encoder->protected_->max_lpc_order < 12) |
+ encoder->private_->local_lpc_compute_autocorrelation = FLAC__lpc_compute_autocorrelation_intrin_sse_lag_12; |
+ else if(encoder->protected_->max_lpc_order < 16) |
+ encoder->private_->local_lpc_compute_autocorrelation = FLAC__lpc_compute_autocorrelation_intrin_sse_lag_16; |
+# endif |
+ |
+# ifdef FLAC__SSE2_SUPPORTED |
+ encoder->private_->local_lpc_compute_residual_from_qlp_coefficients_16bit = FLAC__lpc_compute_residual_from_qlp_coefficients_16_intrin_sse2; |
+# endif |
+# ifdef FLAC__SSE4_1_SUPPORTED |
+ if(encoder->private_->cpuinfo.x86.sse41) { |
+ encoder->private_->local_lpc_compute_residual_from_qlp_coefficients = FLAC__lpc_compute_residual_from_qlp_coefficients_intrin_sse41; |
+ } |
+# endif |
+# ifdef FLAC__AVX2_SUPPORTED |
+ if(encoder->private_->cpuinfo.x86.avx2) { |
+ encoder->private_->local_lpc_compute_residual_from_qlp_coefficients_16bit = FLAC__lpc_compute_residual_from_qlp_coefficients_16_intrin_avx2; |
+ encoder->private_->local_lpc_compute_residual_from_qlp_coefficients = FLAC__lpc_compute_residual_from_qlp_coefficients_intrin_avx2; |
+ encoder->private_->local_lpc_compute_residual_from_qlp_coefficients_64bit = FLAC__lpc_compute_residual_from_qlp_coefficients_wide_intrin_avx2; |
+ } |
+# endif |
+ |
+# ifdef FLAC__SSE2_SUPPORTED |
+ encoder->private_->local_fixed_compute_best_predictor = FLAC__fixed_compute_best_predictor_intrin_sse2; |
+ encoder->private_->local_fixed_compute_best_predictor_wide = FLAC__fixed_compute_best_predictor_wide_intrin_sse2; |
+# endif |
+# ifdef FLAC__SSSE3_SUPPORTED |
+ if (encoder->private_->cpuinfo.x86.ssse3) { |
+ encoder->private_->local_fixed_compute_best_predictor = FLAC__fixed_compute_best_predictor_intrin_ssse3; |
+ encoder->private_->local_fixed_compute_best_predictor_wide = FLAC__fixed_compute_best_predictor_wide_intrin_ssse3; |
+ } |
+# endif |
+# endif /* FLAC__HAS_X86INTRIN */ |
+# endif /* FLAC__CPU_... */ |
} |
# endif /* !FLAC__NO_ASM */ |
#endif /* !FLAC__INTEGER_ONLY_LIBRARY */ |
+#if !defined FLAC__NO_ASM && defined FLAC__HAS_X86INTRIN |
+ if(encoder->private_->cpuinfo.use_asm) { |
+# if defined FLAC__CPU_IA32 |
+# ifdef FLAC__SSE2_SUPPORTED |
+ if(encoder->private_->cpuinfo.ia32.sse2) |
+ encoder->private_->local_precompute_partition_info_sums = FLAC__precompute_partition_info_sums_intrin_sse2; |
+# endif |
+# ifdef FLAC__SSSE3_SUPPORTED |
+ if(encoder->private_->cpuinfo.ia32.ssse3) |
+ encoder->private_->local_precompute_partition_info_sums = FLAC__precompute_partition_info_sums_intrin_ssse3; |
+# endif |
+# ifdef FLAC__AVX2_SUPPORTED |
+ if(encoder->private_->cpuinfo.ia32.avx2) |
+ encoder->private_->local_precompute_partition_info_sums = FLAC__precompute_partition_info_sums_intrin_avx2; |
+# endif |
+# elif defined FLAC__CPU_X86_64 |
+# ifdef FLAC__SSE2_SUPPORTED |
+ encoder->private_->local_precompute_partition_info_sums = FLAC__precompute_partition_info_sums_intrin_sse2; |
+# endif |
+# ifdef FLAC__SSSE3_SUPPORTED |
+ if(encoder->private_->cpuinfo.x86.ssse3) |
+ encoder->private_->local_precompute_partition_info_sums = FLAC__precompute_partition_info_sums_intrin_ssse3; |
+# endif |
+# ifdef FLAC__AVX2_SUPPORTED |
+ if(encoder->private_->cpuinfo.x86.avx2) |
+ encoder->private_->local_precompute_partition_info_sums = FLAC__precompute_partition_info_sums_intrin_avx2; |
+# endif |
+# endif /* FLAC__CPU_... */ |
+ } |
+#endif /* !FLAC__NO_ASM && FLAC__HAS_X86INTRIN */ |
/* finally override based on wide-ness if necessary */ |
if(encoder->private_->use_wide_by_block) { |
- encoder->private_->local_fixed_compute_best_predictor = FLAC__fixed_compute_best_predictor_wide; |
+ encoder->private_->local_fixed_compute_best_predictor = encoder->private_->local_fixed_compute_best_predictor_wide; |
} |
/* set state to OK; from here on, errors are fatal and we'll override the state then */ |
@@ -997,7 +1091,7 @@ static FLAC__StreamEncoderInitStatus init_stream_internal_( |
*/ |
encoder->private_->verify.input_fifo.size = encoder->protected_->blocksize+OVERREAD_; |
for(i = 0; i < encoder->protected_->channels; i++) { |
- if(0 == (encoder->private_->verify.input_fifo.data[i] = (FLAC__int32*)safe_malloc_mul_2op_(sizeof(FLAC__int32), /*times*/encoder->private_->verify.input_fifo.size))) { |
+ if(0 == (encoder->private_->verify.input_fifo.data[i] = safe_malloc_mul_2op_p(sizeof(FLAC__int32), /*times*/encoder->private_->verify.input_fifo.size))) { |
encoder->protected_->state = FLAC__STREAM_ENCODER_MEMORY_ALLOCATION_ERROR; |
return FLAC__STREAM_ENCODER_INIT_STATUS_ENCODER_ERROR; |
} |
@@ -1007,10 +1101,12 @@ static FLAC__StreamEncoderInitStatus init_stream_internal_( |
/* |
* Now set up a stream decoder for verification |
*/ |
- encoder->private_->verify.decoder = FLAC__stream_decoder_new(); |
if(0 == encoder->private_->verify.decoder) { |
- encoder->protected_->state = FLAC__STREAM_ENCODER_VERIFY_DECODER_ERROR; |
- return FLAC__STREAM_ENCODER_INIT_STATUS_ENCODER_ERROR; |
+ encoder->private_->verify.decoder = FLAC__stream_decoder_new(); |
+ if(0 == encoder->private_->verify.decoder) { |
+ encoder->protected_->state = FLAC__STREAM_ENCODER_VERIFY_DECODER_ERROR; |
+ return FLAC__STREAM_ENCODER_INIT_STATUS_ENCODER_ERROR; |
+ } |
} |
if(FLAC__stream_decoder_init_stream(encoder->private_->verify.decoder, verify_read_callback_, /*seek_callback=*/0, /*tell_callback=*/0, /*length_callback=*/0, /*eof_callback=*/0, verify_write_callback_, verify_metadata_callback_, verify_error_callback_, /*client_data=*/encoder) != FLAC__STREAM_DECODER_INIT_STATUS_OK) { |
@@ -1183,7 +1279,7 @@ FLAC_API FLAC__StreamEncoderInitStatus FLAC__stream_encoder_init_ogg_stream( |
/*is_ogg=*/true |
); |
} |
- |
+ |
static FLAC__StreamEncoderInitStatus init_FILE_internal_( |
FLAC__StreamEncoder *encoder, |
FILE *file, |
@@ -1214,6 +1310,13 @@ static FLAC__StreamEncoderInitStatus init_FILE_internal_( |
if(file == stdout) |
file = get_binary_stdout_(); /* just to be safe */ |
+#ifdef _WIN32 |
+ /* |
+ * Windows can suffer quite badly from disk fragmentation. This can be |
+ * reduced significantly by setting the output buffer size to be 10MB. |
+ */ |
+ setvbuf(file, NULL, _IOFBF, 10*1024*1024); |
+#endif |
encoder->private_->file = file; |
encoder->private_->progress_callback = progress_callback; |
@@ -1245,7 +1348,7 @@ static FLAC__StreamEncoderInitStatus init_FILE_internal_( |
return init_status; |
} |
- |
+ |
FLAC_API FLAC__StreamEncoderInitStatus FLAC__stream_encoder_init_FILE( |
FLAC__StreamEncoder *encoder, |
FILE *file, |
@@ -1255,7 +1358,7 @@ FLAC_API FLAC__StreamEncoderInitStatus FLAC__stream_encoder_init_FILE( |
{ |
return init_FILE_internal_(encoder, file, progress_callback, client_data, /*is_ogg=*/false); |
} |
- |
+ |
FLAC_API FLAC__StreamEncoderInitStatus FLAC__stream_encoder_init_ogg_FILE( |
FLAC__StreamEncoder *encoder, |
FILE *file, |
@@ -1286,7 +1389,7 @@ static FLAC__StreamEncoderInitStatus init_file_internal_( |
if(encoder->protected_->state != FLAC__STREAM_ENCODER_UNINITIALIZED) |
return FLAC__STREAM_ENCODER_INIT_STATUS_ALREADY_INITIALIZED; |
- file = filename? fopen(filename, "w+b") : stdout; |
+ file = filename? flac_fopen(filename, "w+b") : stdout; |
if(file == 0) { |
encoder->protected_->state = FLAC__STREAM_ENCODER_IO_ERROR; |
@@ -1482,11 +1585,10 @@ FLAC_API FLAC__bool FLAC__stream_encoder_set_compression_level(FLAC__StreamEncod |
ok &= FLAC__stream_encoder_set_do_mid_side_stereo (encoder, compression_levels_[value].do_mid_side_stereo); |
ok &= FLAC__stream_encoder_set_loose_mid_side_stereo (encoder, compression_levels_[value].loose_mid_side_stereo); |
#ifndef FLAC__INTEGER_ONLY_LIBRARY |
-#if 0 |
- /* was: */ |
+#if 1 |
ok &= FLAC__stream_encoder_set_apodization (encoder, compression_levels_[value].apodization); |
- /* but it's too hard to specify the string in a locale-specific way */ |
#else |
+ /* equivalent to -A tukey(0.5) */ |
encoder->protected_->num_apodizations = 1; |
encoder->protected_->apodizations[0].type = FLAC__APODIZATION_TUKEY; |
encoder->protected_->apodizations[0].parameters.tukey.p = 0.5; |
@@ -1590,6 +1692,48 @@ FLAC_API FLAC__bool FLAC__stream_encoder_set_apodization(FLAC__StreamEncoder *en |
encoder->protected_->apodizations[encoder->protected_->num_apodizations++].type = FLAC__APODIZATION_TUKEY; |
} |
} |
+ else if(n>15 && 0 == strncmp("partial_tukey(" , specification, 14)) { |
+ FLAC__int32 tukey_parts = (FLAC__int32)strtod(specification+14, 0); |
+ const char *si_1 = strchr(specification, '/'); |
+ FLAC__real overlap = si_1?flac_min((FLAC__real)strtod(si_1+1, 0),0.99f):0.1f; |
+ FLAC__real overlap_units = 1.0f/(1.0f - overlap) - 1.0f; |
+ const char *si_2 = strchr((si_1?(si_1+1):specification), '/'); |
+ FLAC__real tukey_p = si_2?(FLAC__real)strtod(si_2+1, 0):0.2f; |
+ |
+ if (tukey_parts <= 1) { |
+ encoder->protected_->apodizations[encoder->protected_->num_apodizations].parameters.tukey.p = tukey_p; |
+ encoder->protected_->apodizations[encoder->protected_->num_apodizations++].type = FLAC__APODIZATION_TUKEY; |
+ }else if (encoder->protected_->num_apodizations + tukey_parts < 32){ |
+ FLAC__int32 m; |
+ for(m = 0; m < tukey_parts; m++){ |
+ encoder->protected_->apodizations[encoder->protected_->num_apodizations].parameters.multiple_tukey.p = tukey_p; |
+ encoder->protected_->apodizations[encoder->protected_->num_apodizations].parameters.multiple_tukey.start = m/(tukey_parts+overlap_units); |
+ encoder->protected_->apodizations[encoder->protected_->num_apodizations].parameters.multiple_tukey.end = (m+1+overlap_units)/(tukey_parts+overlap_units); |
+ encoder->protected_->apodizations[encoder->protected_->num_apodizations++].type = FLAC__APODIZATION_PARTIAL_TUKEY; |
+ } |
+ } |
+ } |
+ else if(n>16 && 0 == strncmp("punchout_tukey(" , specification, 15)) { |
+ FLAC__int32 tukey_parts = (FLAC__int32)strtod(specification+15, 0); |
+ const char *si_1 = strchr(specification, '/'); |
+ FLAC__real overlap = si_1?flac_min((FLAC__real)strtod(si_1+1, 0),0.99f):0.2f; |
+ FLAC__real overlap_units = 1.0f/(1.0f - overlap) - 1.0f; |
+ const char *si_2 = strchr((si_1?(si_1+1):specification), '/'); |
+ FLAC__real tukey_p = si_2?(FLAC__real)strtod(si_2+1, 0):0.2f; |
+ |
+ if (tukey_parts <= 1) { |
+ encoder->protected_->apodizations[encoder->protected_->num_apodizations].parameters.tukey.p = tukey_p; |
+ encoder->protected_->apodizations[encoder->protected_->num_apodizations++].type = FLAC__APODIZATION_TUKEY; |
+ }else if (encoder->protected_->num_apodizations + tukey_parts < 32){ |
+ FLAC__int32 m; |
+ for(m = 0; m < tukey_parts; m++){ |
+ encoder->protected_->apodizations[encoder->protected_->num_apodizations].parameters.multiple_tukey.p = tukey_p; |
+ encoder->protected_->apodizations[encoder->protected_->num_apodizations].parameters.multiple_tukey.start = m/(tukey_parts+overlap_units); |
+ encoder->protected_->apodizations[encoder->protected_->num_apodizations].parameters.multiple_tukey.end = (m+1+overlap_units)/(tukey_parts+overlap_units); |
+ encoder->protected_->apodizations[encoder->protected_->num_apodizations++].type = FLAC__APODIZATION_PUNCHOUT_TUKEY; |
+ } |
+ } |
+ } |
else if(n==5 && 0 == strncmp("welch" , specification, n)) |
encoder->protected_->apodizations[encoder->protected_->num_apodizations++].type = FLAC__APODIZATION_WELCH; |
if (encoder->protected_->num_apodizations == 32) |
@@ -1736,7 +1880,7 @@ FLAC_API FLAC__bool FLAC__stream_encoder_set_metadata(FLAC__StreamEncoder *encod |
} |
if(num_blocks) { |
FLAC__StreamMetadata **m; |
- if(0 == (m = (FLAC__StreamMetadata**)safe_malloc_mul_2op_(sizeof(m[0]), /*times*/num_blocks))) |
+ if(0 == (m = safe_malloc_mul_2op_p(sizeof(m[0]), /*times*/num_blocks))) |
return false; |
memcpy(m, metadata, sizeof(m[0]) * num_blocks); |
encoder->protected_->metadata = m; |
@@ -1990,7 +2134,7 @@ FLAC_API FLAC__bool FLAC__stream_encoder_process(FLAC__StreamEncoder *encoder, c |
FLAC__ASSERT(encoder->protected_->state == FLAC__STREAM_ENCODER_OK); |
do { |
- const unsigned n = min(blocksize+OVERREAD_-encoder->private_->current_sample_number, samples-j); |
+ const unsigned n = flac_min(blocksize+OVERREAD_-encoder->private_->current_sample_number, samples-j); |
if(encoder->protected_->verify) |
append_to_verify_fifo_(&encoder->private_->verify.input_fifo, buffer, j, channels, n); |
@@ -2053,7 +2197,7 @@ FLAC_API FLAC__bool FLAC__stream_encoder_process_interleaved(FLAC__StreamEncoder |
*/ |
do { |
if(encoder->protected_->verify) |
- append_to_verify_fifo_interleaved_(&encoder->private_->verify.input_fifo, buffer, j, channels, min(blocksize+OVERREAD_-encoder->private_->current_sample_number, samples-j)); |
+ append_to_verify_fifo_interleaved_(&encoder->private_->verify.input_fifo, buffer, j, channels, flac_min(blocksize+OVERREAD_-encoder->private_->current_sample_number, samples-j)); |
/* "i <= blocksize" to overread 1 sample; see comment in OVERREAD_ decl */ |
for(i = encoder->private_->current_sample_number; i <= blocksize && j < samples; i++, j++) { |
@@ -2088,7 +2232,7 @@ FLAC_API FLAC__bool FLAC__stream_encoder_process_interleaved(FLAC__StreamEncoder |
*/ |
do { |
if(encoder->protected_->verify) |
- append_to_verify_fifo_interleaved_(&encoder->private_->verify.input_fifo, buffer, j, channels, min(blocksize+OVERREAD_-encoder->private_->current_sample_number, samples-j)); |
+ append_to_verify_fifo_interleaved_(&encoder->private_->verify.input_fifo, buffer, j, channels, flac_min(blocksize+OVERREAD_-encoder->private_->current_sample_number, samples-j)); |
/* "i <= blocksize" to overread 1 sample; see comment in OVERREAD_ decl */ |
for(i = encoder->private_->current_sample_number; i <= blocksize && j < samples; i++, j++) { |
@@ -2171,6 +2315,8 @@ void set_defaults_(FLAC__StreamEncoder *encoder) |
#if FLAC__HAS_OGG |
FLAC__ogg_encoder_aspect_set_defaults(&encoder->protected_->ogg_encoder_aspect); |
#endif |
+ |
+ FLAC__stream_encoder_set_compression_level(encoder, 5); |
} |
void free_(FLAC__StreamEncoder *encoder) |
@@ -2269,8 +2415,8 @@ FLAC__bool resize_buffers_(FLAC__StreamEncoder *encoder, unsigned new_blocksize) |
ok = true; |
- /* WATCHOUT: FLAC__lpc_compute_residual_from_qlp_coefficients_asm_ia32_mmx() |
- * requires that the input arrays (in our case the integer signals) |
+ /* WATCHOUT: FLAC__lpc_compute_residual_from_qlp_coefficients_asm_ia32_mmx() and ..._intrin_sse2() |
+ * require that the input arrays (in our case the integer signals) |
* have a buffer of up to 3 zeroes in front (at negative indices) for |
* alignment purposes; we use 4 in front to keep the data well-aligned. |
*/ |
@@ -2367,6 +2513,12 @@ FLAC__bool resize_buffers_(FLAC__StreamEncoder *encoder, unsigned new_blocksize) |
case FLAC__APODIZATION_TUKEY: |
FLAC__window_tukey(encoder->private_->window[i], new_blocksize, encoder->protected_->apodizations[i].parameters.tukey.p); |
break; |
+ case FLAC__APODIZATION_PARTIAL_TUKEY: |
+ FLAC__window_partial_tukey(encoder->private_->window[i], new_blocksize, encoder->protected_->apodizations[i].parameters.multiple_tukey.p, encoder->protected_->apodizations[i].parameters.multiple_tukey.start, encoder->protected_->apodizations[i].parameters.multiple_tukey.end); |
+ break; |
+ case FLAC__APODIZATION_PUNCHOUT_TUKEY: |
+ FLAC__window_punchout_tukey(encoder->private_->window[i], new_blocksize, encoder->protected_->apodizations[i].parameters.multiple_tukey.p, encoder->protected_->apodizations[i].parameters.multiple_tukey.start, encoder->protected_->apodizations[i].parameters.multiple_tukey.end); |
+ break; |
case FLAC__APODIZATION_WELCH: |
FLAC__window_welch(encoder->private_->window[i], new_blocksize); |
break; |
@@ -2428,8 +2580,8 @@ FLAC__bool write_bitbuffer_(FLAC__StreamEncoder *encoder, unsigned samples, FLAC |
FLAC__bitwriter_clear(encoder->private_->frame); |
if(samples > 0) { |
- encoder->private_->streaminfo.data.stream_info.min_framesize = (unsigned)min(bytes, encoder->private_->streaminfo.data.stream_info.min_framesize); |
- encoder->private_->streaminfo.data.stream_info.max_framesize = (unsigned)max(bytes, encoder->private_->streaminfo.data.stream_info.max_framesize); |
+ encoder->private_->streaminfo.data.stream_info.min_framesize = flac_min(bytes, encoder->private_->streaminfo.data.stream_info.min_framesize); |
+ encoder->private_->streaminfo.data.stream_info.max_framesize = flac_max(bytes, encoder->private_->streaminfo.data.stream_info.max_framesize); |
} |
return true; |
@@ -2440,6 +2592,10 @@ FLAC__StreamEncoderWriteStatus write_frame_(FLAC__StreamEncoder *encoder, const |
FLAC__StreamEncoderWriteStatus status; |
FLAC__uint64 output_position = 0; |
+#if FLAC__HAS_OGG == 0 |
+ (void)is_last_block; |
+#endif |
+ |
/* FLAC__STREAM_ENCODER_TELL_STATUS_UNSUPPORTED just means we didn't get the offset; no error */ |
if(encoder->private_->tell_callback && encoder->private_->tell_callback(encoder, &output_position, encoder->private_->client_data) == FLAC__STREAM_ENCODER_TELL_STATUS_ERROR) { |
encoder->protected_->state = FLAC__STREAM_ENCODER_CLIENT_ERROR; |
@@ -2516,7 +2672,7 @@ FLAC__StreamEncoderWriteStatus write_frame_(FLAC__StreamEncoder *encoder, const |
* when the encoder goes back to write metadata, 'current_frame' |
* will drop back to 0. |
*/ |
- encoder->private_->frames_written = max(encoder->private_->frames_written, encoder->private_->current_frame_number+1); |
+ encoder->private_->frames_written = flac_max(encoder->private_->frames_written, encoder->private_->current_frame_number+1); |
} |
else |
encoder->protected_->state = FLAC__STREAM_ENCODER_CLIENT_ERROR; |
@@ -2527,7 +2683,7 @@ FLAC__StreamEncoderWriteStatus write_frame_(FLAC__StreamEncoder *encoder, const |
/* Gets called when the encoding process has finished so that we can update the STREAMINFO and SEEKTABLE blocks. */ |
void update_metadata_(const FLAC__StreamEncoder *encoder) |
{ |
- FLAC__byte b[max(6, FLAC__STREAM_METADATA_SEEKPOINT_LENGTH)]; |
+ FLAC__byte b[flac_max(6u, FLAC__STREAM_METADATA_SEEKPOINT_LENGTH)]; |
const FLAC__StreamMetadata *metadata = &encoder->private_->streaminfo; |
const FLAC__uint64 samples = metadata->data.stream_info.total_samples; |
const unsigned min_framesize = metadata->data.stream_info.min_framesize; |
@@ -2692,7 +2848,7 @@ void update_ogg_metadata_(FLAC__StreamEncoder *encoder) |
FLAC__OGG_MAPPING_NUM_HEADERS_LENGTH + |
FLAC__STREAM_SYNC_LENGTH |
; |
- FLAC__byte b[max(6, FLAC__STREAM_METADATA_SEEKPOINT_LENGTH)]; |
+ FLAC__byte b[flac_max(6u, FLAC__STREAM_METADATA_SEEKPOINT_LENGTH)]; |
const FLAC__StreamMetadata *metadata = &encoder->private_->streaminfo; |
const FLAC__uint64 samples = metadata->data.stream_info.total_samples; |
const unsigned min_framesize = metadata->data.stream_info.min_framesize; |
@@ -2943,9 +3099,9 @@ FLAC__bool process_subframes_(FLAC__StreamEncoder *encoder, FLAC__bool is_fracti |
} |
else { |
max_partition_order = FLAC__format_get_max_rice_partition_order_from_blocksize(encoder->protected_->blocksize); |
- max_partition_order = min(max_partition_order, encoder->protected_->max_residual_partition_order); |
+ max_partition_order = flac_min(max_partition_order, encoder->protected_->max_residual_partition_order); |
} |
- min_partition_order = min(min_partition_order, max_partition_order); |
+ min_partition_order = flac_min(min_partition_order, max_partition_order); |
/* |
* Setup the frame |
@@ -3194,7 +3350,7 @@ FLAC__bool process_subframe_( |
#endif |
#ifndef FLAC__INTEGER_ONLY_LIBRARY |
FLAC__double lpc_residual_bits_per_sample; |
- FLAC__real autoc[FLAC__MAX_LPC_ORDER+1]; /* WATCHOUT: the size is important even though encoder->protected_->max_lpc_order might be less; some asm routines need all the space */ |
+ FLAC__real autoc[FLAC__MAX_LPC_ORDER+1]; /* WATCHOUT: the size is important even though encoder->protected_->max_lpc_order might be less; some asm and x86 intrinsic routines need all the space */ |
FLAC__double lpc_error[FLAC__MAX_LPC_ORDER]; |
unsigned min_lpc_order, max_lpc_order, lpc_order; |
unsigned min_qlp_coeff_precision, max_qlp_coeff_precision, qlp_coeff_precision; |
@@ -3347,10 +3503,10 @@ FLAC__bool process_subframe_( |
} |
if(encoder->protected_->do_qlp_coeff_prec_search) { |
min_qlp_coeff_precision = FLAC__MIN_QLP_COEFF_PRECISION; |
- /* try to ensure a 32-bit datapath throughout for 16bps(+1bps for side channel) or less */ |
- if(subframe_bps <= 17) { |
- max_qlp_coeff_precision = min(32 - subframe_bps - lpc_order, FLAC__MAX_QLP_COEFF_PRECISION); |
- max_qlp_coeff_precision = max(max_qlp_coeff_precision, min_qlp_coeff_precision); |
+ /* try to keep qlp coeff precision such that only 32-bit math is required for decode of <=16bps streams */ |
+ if(subframe_bps <= 16) { |
+ max_qlp_coeff_precision = flac_min(32 - subframe_bps - FLAC__bitmath_ilog2(lpc_order), FLAC__MAX_QLP_COEFF_PRECISION); |
+ max_qlp_coeff_precision = flac_max(max_qlp_coeff_precision, min_qlp_coeff_precision); |
} |
else |
max_qlp_coeff_precision = FLAC__MAX_QLP_COEFF_PRECISION; |
@@ -3585,7 +3741,7 @@ unsigned evaluate_lpc_subframe_( |
FLAC__EntropyCodingMethod_PartitionedRiceContents *partitioned_rice_contents |
) |
{ |
- FLAC__int32 qlp_coeff[FLAC__MAX_LPC_ORDER]; |
+ FLAC__int32 qlp_coeff[FLAC__MAX_LPC_ORDER]; /* WATCHOUT: the size is important; some x86 intrinsic routines need more than lpc order elements */ |
unsigned i, residual_bits, estimate; |
int quantization, ret; |
const unsigned residual_samples = blocksize - order; |
@@ -3594,7 +3750,7 @@ unsigned evaluate_lpc_subframe_( |
if(subframe_bps <= 16) { |
FLAC__ASSERT(order > 0); |
FLAC__ASSERT(order <= FLAC__MAX_LPC_ORDER); |
- qlp_coeff_precision = min(qlp_coeff_precision, 32 - subframe_bps - FLAC__bitmath_ilog2(order)); |
+ qlp_coeff_precision = flac_min(qlp_coeff_precision, 32 - subframe_bps - FLAC__bitmath_ilog2(order)); |
} |
ret = FLAC__lpc_quantize_coefficients(lp_coeff, order, qlp_coeff_precision, qlp_coeff, &quantization); |
@@ -3698,9 +3854,9 @@ unsigned find_best_partition_order_( |
const unsigned blocksize = residual_samples + predictor_order; |
max_partition_order = FLAC__format_get_max_rice_partition_order_from_blocksize_limited_max_and_predictor_order(max_partition_order, blocksize, predictor_order); |
- min_partition_order = min(min_partition_order, max_partition_order); |
+ min_partition_order = flac_min(min_partition_order, max_partition_order); |
- precompute_partition_info_sums_(residual, abs_residual_partition_sums, residual_samples, predictor_order, min_partition_order, max_partition_order, bps); |
+ private_->local_precompute_partition_info_sums(residual, abs_residual_partition_sums, residual_samples, predictor_order, min_partition_order, max_partition_order, bps); |
if(do_escape_coding) |
precompute_partition_info_escapes_(residual, raw_bits_per_partition, residual_samples, predictor_order, min_partition_order, max_partition_order); |
@@ -3752,10 +3908,10 @@ unsigned find_best_partition_order_( |
unsigned partition; |
/* save best parameters and raw_bits */ |
- FLAC__format_entropy_coding_method_partitioned_rice_contents_ensure_size(prc, max(6, best_partition_order)); |
- memcpy(prc->parameters, private_->partitioned_rice_contents_extra[best_parameters_index].parameters, sizeof(unsigned)*((size_t)1<<(best_partition_order))); |
+ FLAC__format_entropy_coding_method_partitioned_rice_contents_ensure_size(prc, flac_max(6u, best_partition_order)); |
+ memcpy(prc->parameters, private_->partitioned_rice_contents_extra[best_parameters_index].parameters, sizeof(unsigned)*(1<<(best_partition_order))); |
if(do_escape_coding) |
- memcpy(prc->raw_bits, private_->partitioned_rice_contents_extra[best_parameters_index].raw_bits, sizeof(unsigned)*((size_t)1<<(best_partition_order))); |
+ memcpy(prc->raw_bits, private_->partitioned_rice_contents_extra[best_parameters_index].raw_bits, sizeof(unsigned)*(1<<(best_partition_order))); |
/* |
* Now need to check if the type should be changed to |
* FLAC__ENTROPY_CODING_METHOD_PARTITIONED_RICE2 based on the |
@@ -3772,17 +3928,6 @@ unsigned find_best_partition_order_( |
return best_residual_bits; |
} |
-#if defined(FLAC__CPU_IA32) && !defined FLAC__NO_ASM && defined FLAC__HAS_NASM |
-extern void precompute_partition_info_sums_32bit_asm_ia32_( |
- const FLAC__int32 residual[], |
- FLAC__uint64 abs_residual_partition_sums[], |
- unsigned blocksize, |
- unsigned predictor_order, |
- unsigned min_partition_order, |
- unsigned max_partition_order |
-); |
-#endif |
- |
void precompute_partition_info_sums_( |
const FLAC__int32 residual[], |
FLAC__uint64 abs_residual_partition_sums[], |
@@ -3798,21 +3943,12 @@ void precompute_partition_info_sums_( |
FLAC__ASSERT(default_partition_samples > predictor_order); |
-#if defined(FLAC__CPU_IA32) && !defined FLAC__NO_ASM && defined FLAC__HAS_NASM |
- /* slightly pessimistic but still catches all common cases */ |
- /* WATCHOUT: "+ bps" is an assumption that the average residual magnitude will not be more than "bps" bits */ |
- if(FLAC__bitmath_ilog2(default_partition_samples) + bps < 32) { |
- precompute_partition_info_sums_32bit_asm_ia32_(residual, abs_residual_partition_sums, residual_samples + predictor_order, predictor_order, min_partition_order, max_partition_order); |
- return; |
- } |
-#endif |
- |
/* first do max_partition_order */ |
{ |
unsigned partition, residual_sample, end = (unsigned)(-(int)predictor_order); |
- /* slightly pessimistic but still catches all common cases */ |
- /* WATCHOUT: "+ bps" is an assumption that the average residual magnitude will not be more than "bps" bits */ |
- if(FLAC__bitmath_ilog2(default_partition_samples) + bps < 32) { |
+ /* WATCHOUT: "+ bps + FLAC__MAX_EXTRA_RESIDUAL_BPS" is the maximum |
+ * assumed size of the average residual magnitude */ |
+ if(FLAC__bitmath_ilog2(default_partition_samples) + bps + FLAC__MAX_EXTRA_RESIDUAL_BPS < 32) { |
FLAC__uint32 abs_residual_partition_sum; |
for(partition = residual_sample = 0; partition < partitions; partition++) { |
@@ -3904,7 +4040,7 @@ void precompute_partition_info_escapes_( |
for(i = 0; i < partitions; i++) { |
m = raw_bits_per_partition[from_partition]; |
from_partition++; |
- raw_bits_per_partition[to_partition] = max(m, raw_bits_per_partition[from_partition]); |
+ raw_bits_per_partition[to_partition] = flac_max(m, raw_bits_per_partition[from_partition]); |
from_partition++; |
to_partition++; |
} |
@@ -3912,7 +4048,7 @@ void precompute_partition_info_escapes_( |
} |
#ifdef EXACT_RICE_BITS_CALCULATION |
-static FLaC__INLINE unsigned count_rice_bits_in_partition_( |
+static inline unsigned count_rice_bits_in_partition_( |
const unsigned rice_parameter, |
const unsigned partition_samples, |
const FLAC__int32 *residual |
@@ -3927,7 +4063,7 @@ static FLaC__INLINE unsigned count_rice_bits_in_partition_( |
return partition_bits; |
} |
#else |
-static FLaC__INLINE unsigned count_rice_bits_in_partition_( |
+static inline unsigned count_rice_bits_in_partition_( |
const unsigned rice_parameter, |
const unsigned partition_samples, |
const FLAC__uint64 abs_residual_partition_sum |
@@ -3982,7 +4118,7 @@ FLAC__bool set_partitioned_rice_( |
FLAC__ASSERT(suggested_rice_parameter < FLAC__ENTROPY_CODING_METHOD_PARTITIONED_RICE2_ESCAPE_PARAMETER); |
FLAC__ASSERT(rice_parameter_limit <= FLAC__ENTROPY_CODING_METHOD_PARTITIONED_RICE2_ESCAPE_PARAMETER); |
- FLAC__format_entropy_coding_method_partitioned_rice_contents_ensure_size(partitioned_rice_contents, max(6, partition_order)); |
+ FLAC__format_entropy_coding_method_partitioned_rice_contents_ensure_size(partitioned_rice_contents, flac_max(6u, partition_order)); |
parameters = partitioned_rice_contents->parameters; |
raw_bits = partitioned_rice_contents->raw_bits; |
@@ -4056,8 +4192,35 @@ FLAC__bool set_partitioned_rice_( |
* in the partition, so the actual mean is |
* mean/partition_samples |
*/ |
+#if 0 /* old simple code */ |
for(rice_parameter = 0, k = partition_samples; k < mean; rice_parameter++, k <<= 1) |
; |
+#else |
+#if defined FLAC__CPU_X86_64 /* and other 64-bit arch, too */ |
+ if(mean <= 0x80000000/512) { /* 512: more or less optimal for both 16- and 24-bit input */ |
+#else |
+ if(mean <= 0x80000000/8) { /* 32-bit arch: use 32-bit math if possible */ |
+#endif |
+ FLAC__uint32 k2, mean2 = (FLAC__uint32) mean; |
+ rice_parameter = 0; k2 = partition_samples; |
+ while(k2*8 < mean2) { /* requires: mean <= (2^31)/8 */ |
+ rice_parameter += 4; k2 <<= 4; /* tuned for 16-bit input */ |
+ } |
+ while(k2 < mean2) { /* requires: mean <= 2^31 */ |
+ rice_parameter++; k2 <<= 1; |
+ } |
+ } |
+ else { |
+ rice_parameter = 0; k = partition_samples; |
+ if(mean <= FLAC__U64L(0x8000000000000000)/128) /* usually mean is _much_ smaller than this value */ |
+ while(k*128 < mean) { /* requires: mean <= (2^63)/128 */ |
+ rice_parameter += 8; k <<= 8; /* tuned for 24-bit input */ |
+ } |
+ while(k < mean) { /* requires: mean <= 2^63 */ |
+ rice_parameter++; k <<= 1; |
+ } |
+ } |
+#endif |
if(rice_parameter >= rice_parameter_limit) { |
#ifdef DEBUG_VERBOSE |
fprintf(stderr, "clipping rice_parameter (%u -> %u) @6\n", rice_parameter, rice_parameter_limit - 1); |
@@ -4274,7 +4437,7 @@ FLAC__StreamEncoderSeekStatus file_seek_callback_(const FLAC__StreamEncoder *enc |
{ |
(void)client_data; |
- if(fseeko(encoder->private_->file, (off_t)absolute_byte_offset, SEEK_SET) < 0) |
+ if(fseeko(encoder->private_->file, (FLAC__off_t)absolute_byte_offset, SEEK_SET) < 0) |
return FLAC__STREAM_ENCODER_SEEK_STATUS_ERROR; |
else |
return FLAC__STREAM_ENCODER_SEEK_STATUS_OK; |
@@ -4282,7 +4445,7 @@ FLAC__StreamEncoderSeekStatus file_seek_callback_(const FLAC__StreamEncoder *enc |
FLAC__StreamEncoderTellStatus file_tell_callback_(const FLAC__StreamEncoder *encoder, FLAC__uint64 *absolute_byte_offset, void *client_data) |
{ |
- off_t offset; |
+ FLAC__off_t offset; |
(void)client_data; |