third_party/opus/src/src/opus_multistream_encoder.c - Issue 2962373002: [Opus] Update to v1.2.1

Unified Diff: third_party/opus/src/src/opus_multistream_encoder.c

Issue 2962373002: [Opus] Update to v1.2.1 (Closed)

Patch Set: Pre-increment instead of post-increment Created 3 years, 5 months ago

Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.

Jump to:

View side-by-side diff with in-line comments

Index: third_party/opus/src/src/opus_multistream_encoder.c

diff --git a/third_party/opus/src/src/opus_multistream_encoder.c b/third_party/opus/src/src/opus_multistream_encoder.c

index 1698223a16a43536b5dc5fc326244657914a856b..032fc0039b91312e756bf89c6bf0de052f68acf1 100644

--- a/third_party/opus/src/src/opus_multistream_encoder.c

+++ b/third_party/opus/src/src/opus_multistream_encoder.c

@@ -87,7 +87,6 @@ struct OpusMSEncoder {

int variable_duration;

MappingType mapping_type;

opus_int32 bitrate_bps;

- float subframe_mem[3];

/* Encoder states go here */

/* then opus_val32 window_mem[channels*120]; */

/* then opus_val32 preemph_mem[channels]; */

@@ -133,6 +132,29 @@ static opus_val32 *ms_get_window_mem(OpusMSEncoder *st)

return (opus_val32*)(void*)ptr;

}

+#ifdef ENABLE_EXPERIMENTAL_AMBISONICS

+static int validate_ambisonics(int nb_channels, int *nb_streams, int *nb_coupled_streams)

+ int order_plus_one;

+ int acn_channels;

+ int nondiegetic_channels;

+ order_plus_one = isqrt32(nb_channels);

+ acn_channels = order_plus_one * order_plus_one;

+ nondiegetic_channels = nb_channels - acn_channels;

+ if (order_plus_one < 1 || order_plus_one > 15 ||

+ (nondiegetic_channels != 0 && nondiegetic_channels != 2))

+ return 0;

+ if (nb_streams)

+ *nb_streams = acn_channels + (nondiegetic_channels != 0);

+ if (nb_coupled_streams)

+ *nb_coupled_streams = nondiegetic_channels != 0;

+ return 1;

+#endif

static int validate_encoder_layout(const ChannelLayout *layout)

{

int s;

@@ -240,6 +262,7 @@ void surround_analysis(const CELTMode *celt_mode, const void *pcm, opus_val16 *b

int pos[8] = {0};

int upsample;

int frame_size;

+ int freq_size;

opus_val16 channel_offset;

opus_val32 bandE[21];

opus_val16 maskLogE[3][21];

@@ -250,6 +273,7 @@ void surround_analysis(const CELTMode *celt_mode, const void *pcm, opus_val16 *b

upsample = resampling_factor(rate);

frame_size = len*upsample;

+ freq_size = IMIN(960, frame_size);

/* LM = log2(frame_size / 120) */

for (LM=0;LM<celt_mode->maxLM;LM++)

@@ -258,7 +282,7 @@ void surround_analysis(const CELTMode *celt_mode, const void *pcm, opus_val16 *b

ALLOC(in, frame_size+overlap, opus_val32);

ALLOC(x, len, opus_val16);

- ALLOC(freq, frame_size, opus_val32);

+ ALLOC(freq, freq_size, opus_val32);

channel_pos(channels, pos);

@@ -268,6 +292,9 @@ void surround_analysis(const CELTMode *celt_mode, const void *pcm, opus_val16 *b

for (c=0;c<channels;c++)

{

+ int frame;

+ int nb_frames = frame_size/freq_size;

+ celt_assert(nb_frames*freq_size == frame_size);

OPUS_COPY(in, mem+c*overlap, overlap);

(*copy_channel_in)(x, 1, pcm, channels, c, len);

celt_preemphasis(x, in+overlap, frame_size, 1, upsample, celt_mode->preemph, preemph_mem+c, 0);

@@ -284,18 +311,26 @@ void surround_analysis(const CELTMode *celt_mode, const void *pcm, opus_val16 *b

}

#endif

- clt_mdct_forward(&celt_mode->mdct, in, freq, celt_mode->window,

- overlap, celt_mode->maxLM-LM, 1, arch);

- if (upsample != 1)

+ OPUS_CLEAR(bandE, 21);

+ for (frame=0;frame<nb_frames;frame++)

{

- int bound = len;

- for (i=0;i<bound;i++)

- freq[i] *= upsample;

- for (;i<frame_size;i++)

- freq[i] = 0;

- }

+ opus_val32 tmpE[21];

+ clt_mdct_forward(&celt_mode->mdct, in+960*frame, freq, celt_mode->window,

+ overlap, celt_mode->maxLM-LM, 1, arch);

+ if (upsample != 1)

+ {

+ int bound = freq_size/upsample;

+ for (i=0;i<bound;i++)

+ freq[i] *= upsample;

+ for (;i<freq_size;i++)

+ freq[i] = 0;

+ }

- compute_band_energies(celt_mode, freq, bandE, 21, 1, LM);

+ compute_band_energies(celt_mode, freq, tmpE, 21, 1, LM, arch);

+ /* If we have multiple frames, take the max energy. */

+ for (i=0;i<21;i++)

+ bandE[i] = MAX32(bandE[i], tmpE[i]);

+ }

amp2Log2(celt_mode, 21, 21, bandE, bandLogE+21*c, 1);

/* Apply spreading function with -6 dB/band going up and -12 dB/band going down. */

for (i=1;i<21;i++)

@@ -411,8 +446,8 @@ opus_int32 opus_multistream_surround_encoder_get_size(int channels, int mapping_

#ifdef ENABLE_EXPERIMENTAL_AMBISONICS

} else if (mapping_family==254)

{

- nb_streams=channels;

- nb_coupled_streams=0;

+ if (!validate_ambisonics(channels, &nb_streams, &nb_coupled_streams))

+ return 0;

#endif

} else

return 0;

@@ -448,7 +483,6 @@ static int opus_multistream_encoder_init_impl(

st->layout.nb_channels = channels;

st->layout.nb_streams = streams;

st->layout.nb_coupled_streams = coupled_streams;

- st->subframe_mem[0]=st->subframe_mem[1]=st->subframe_mem[2]=0;

if (mapping_type != MAPPING_TYPE_SURROUND)

st->lfe_stream = -1;

st->bitrate_bps = OPUS_AUTO;

@@ -456,8 +490,16 @@ static int opus_multistream_encoder_init_impl(

st->variable_duration = OPUS_FRAMESIZE_ARG;

for (i=0;i<st->layout.nb_channels;i++)

st->layout.mapping[i] = mapping[i];

- if (!validate_layout(&st->layout) || !validate_encoder_layout(&st->layout))

+ if (!validate_layout(&st->layout))

return OPUS_BAD_ARG;

+ if (mapping_type == MAPPING_TYPE_SURROUND &&

+ !validate_encoder_layout(&st->layout))

+ return OPUS_BAD_ARG;

+#ifdef ENABLE_EXPERIMENTAL_AMBISONICS

+ if (mapping_type == MAPPING_TYPE_AMBISONICS &&

+ !validate_ambisonics(st->layout.nb_channels, NULL, NULL))

+ return OPUS_BAD_ARG;

+#endif

ptr = (char*)st + align(sizeof(OpusMSEncoder));

coupled_size = opus_encoder_get_size(2);

mono_size = opus_encoder_get_size(1);

@@ -553,10 +595,12 @@ int opus_multistream_surround_encoder_init(

} else if (mapping_family==254)

{

int i;

- *streams=channels;

- *coupled_streams=0;

- for(i=0;i<channels;i++)

- mapping[i] = i;

+ if (!validate_ambisonics(channels, streams, coupled_streams))

+ return OPUS_BAD_ARG;

+ for(i = 0; i < (*streams - *coupled_streams); i++)

+ mapping[i] = i + (*coupled_streams * 2);

+ for(i = 0; i < *coupled_streams * 2; i++)

+ mapping[i + (*streams - *coupled_streams)] = i;

#endif

} else

return OPUS_UNIMPLEMENTED;

@@ -672,58 +716,59 @@ static void surround_rate_allocation(

int lfe_offset;

int coupled_ratio; /* Q8 */

int lfe_ratio; /* Q8 */

+ int nb_lfe;

+ int nb_uncoupled;

+ int nb_coupled;

+ int nb_normal;

+ opus_int32 channel_offset;

+ opus_int32 bitrate;

+ int total;

+ nb_lfe = (st->lfe_stream!=-1);

+ nb_coupled = st->layout.nb_coupled_streams;

+ nb_uncoupled = st->layout.nb_streams-nb_coupled-nb_lfe;

+ nb_normal = 2*nb_coupled + nb_uncoupled;

+ /* Give each non-LFE channel enough bits per channel for coding band energy. */

+ channel_offset = 40*IMAX(50, Fs/frame_size);

- if (st->bitrate_bps > st->layout.nb_channels*40000)

- stream_offset = 20000;

- else

- stream_offset = st->bitrate_bps/st->layout.nb_channels/2;

- stream_offset += 60*(Fs/frame_size-50);

- /* We start by giving each stream (coupled or uncoupled) the same bitrate.

- This models the main saving of coupled channels over uncoupled. */

- /* The LFE stream is an exception to the above and gets fewer bits. */

- lfe_offset = 3500 + 60*(Fs/frame_size-50);

- /* Coupled streams get twice the mono rate after the first 20 kb/s. */

- coupled_ratio = 512;

- /* Should depend on the bitrate, for now we assume LFE gets 1/8 the bits of mono */

- lfe_ratio = 32;

- /* Compute bitrate allocation between streams */

if (st->bitrate_bps==OPUS_AUTO)

{

- channel_rate = Fs+60*Fs/frame_size;

+ bitrate = nb_normal*(channel_offset + Fs + 10000) + 8000*nb_lfe;

} else if (st->bitrate_bps==OPUS_BITRATE_MAX)

{

- channel_rate = 300000;

+ bitrate = nb_normal*300000 + nb_lfe*128000;

} else {

- int nb_lfe;

- int nb_uncoupled;

- int nb_coupled;

- int total;

- nb_lfe = (st->lfe_stream!=-1);

- nb_coupled = st->layout.nb_coupled_streams;

- nb_uncoupled = st->layout.nb_streams-nb_coupled-nb_lfe;

- total = (nb_uncoupled<<8) /* mono */

- + coupled_ratio*nb_coupled /* stereo */

- + nb_lfe*lfe_ratio;

- channel_rate = 256*(st->bitrate_bps-lfe_offset*nb_lfe-stream_offset*(nb_coupled+nb_uncoupled))/total;

+ bitrate = st->bitrate_bps;

}

-#ifndef FIXED_POINT

- if (st->variable_duration==OPUS_FRAMESIZE_VARIABLE && frame_size != Fs/50)

- {

- opus_int32 bonus;

- bonus = 60*(Fs/frame_size-50);

- channel_rate += bonus;

- }

-#endif

+ /* Give LFE some basic stream_channel allocation but never exceed 1/20 of the

+ total rate for the non-energy part to avoid problems at really low rate. */

+ lfe_offset = IMIN(bitrate/20, 3000) + 15*IMAX(50, Fs/frame_size);

+ /* We give each stream (coupled or uncoupled) a starting bitrate.

+ This models the main saving of coupled channels over uncoupled. */

+ stream_offset = (bitrate - channel_offset*nb_normal - lfe_offset*nb_lfe)/nb_normal/2;

+ stream_offset = IMAX(0, IMIN(20000, stream_offset));

+ /* Coupled streams get twice the mono rate after the offset is allocated. */

+ coupled_ratio = 512;

+ /* Should depend on the bitrate, for now we assume LFE gets 1/8 the bits of mono */

+ lfe_ratio = 32;

+ total = (nb_uncoupled<<8) /* mono */

+ + coupled_ratio*nb_coupled /* stereo */

+ + nb_lfe*lfe_ratio;

+ channel_rate = 256*(opus_int64)(bitrate - lfe_offset*nb_lfe - stream_offset*(nb_coupled+nb_uncoupled) - channel_offset*nb_normal)/total;

for (i=0;i<st->layout.nb_streams;i++)

{

if (i<st->layout.nb_coupled_streams)

- rate[i] = stream_offset+(channel_rate*coupled_ratio>>8);

+ rate[i] = 2*channel_offset + IMAX(0, stream_offset+(channel_rate*coupled_ratio>>8));

else if (i!=st->lfe_stream)

- rate[i] = stream_offset+channel_rate;

+ rate[i] = channel_offset + IMAX(0, stream_offset + channel_rate);

else

- rate[i] = lfe_offset+(channel_rate*lfe_ratio>>8);

+ rate[i] = IMAX(0, lfe_offset+(channel_rate*lfe_ratio>>8));

}

@@ -736,47 +781,72 @@ static void ambisonics_rate_allocation(

)

{

int i;

- int non_mono_rate;

int total_rate;

+ int directional_rate;

+ int nondirectional_rate;

+ int leftover_bits;

- /* The mono channel gets (rate_ratio_num / rate_ratio_den) times as many bits

- * as all other channels */

+ /* Each nondirectional channel gets (rate_ratio_num / rate_ratio_den) times

+ * as many bits as all other ambisonics channels.

+ */

const int rate_ratio_num = 4;

const int rate_ratio_den = 3;

- const int num_channels = st->layout.nb_streams;

+ const int nb_channels = st->layout.nb_streams + st->layout.nb_coupled_streams;

+ const int nb_nondirectional_channels = st->layout.nb_coupled_streams * 2 + 1;

+ const int nb_directional_channels = st->layout.nb_streams - 1;

if (st->bitrate_bps==OPUS_AUTO)

{

- total_rate = num_channels * (20000 + st->layout.nb_streams*(Fs+60*Fs/frame_size));

+ total_rate = (st->layout.nb_coupled_streams + st->layout.nb_streams) *

+ (Fs+60*Fs/frame_size) + st->layout.nb_streams * 15000;

} else if (st->bitrate_bps==OPUS_BITRATE_MAX)

{

- total_rate = num_channels * 320000;

- } else {

+ total_rate = nb_channels * 320000;

+ } else

+ {

total_rate = st->bitrate_bps;

}

- /* Let y be the non-mono rate and let p, q be integers such that the mono

- * channel rate is (p/q) * y.

+ /* Let y be the directional rate, m be the num of nondirectional channels

+ * m = (s + 1)

+ * and let p, q be integers such that the nondirectional rate is

+ * m_rate = (p / q) * y

* Also let T be the total bitrate to allocate. Then

- * (n - 1) y + (p/q) y = T

- * y = (T q) / (qn - q + p)

+ * T = (n - m) * y + m * m_rate

+ * Solving for y,

+ * y = (q * T) / (m * (p - q) + n * q)

- non_mono_rate =

- total_rate * rate_ratio_den

- / (rate_ratio_den*num_channels + rate_ratio_num - rate_ratio_den);

+ directional_rate =

+ total_rate * rate_ratio_den

+ / (nb_nondirectional_channels * (rate_ratio_num - rate_ratio_den)

+ + nb_channels * rate_ratio_den);

-#ifndef FIXED_POINT

- if (st->variable_duration==OPUS_FRAMESIZE_VARIABLE && frame_size != Fs/50)

- {

- opus_int32 bonus = 60*(Fs/frame_size-50);

- non_mono_rate += bonus;

- }

-#endif

+ /* Calculate the nondirectional rate.

+ * m_rate = y * (p / q)

+ */

+ nondirectional_rate = directional_rate * rate_ratio_num / rate_ratio_den;

- rate[0] = total_rate - (num_channels - 1) * non_mono_rate;

- for (i=1;i<st->layout.nb_streams;i++)

+ /* Calculate the leftover from truncation error.

+ * leftover = T - y * (n - m) - m_rate * m

+ * Place leftover bits in omnidirectional channel.

+ */

+ leftover_bits = total_rate

+ - directional_rate * nb_directional_channels

+ - nondirectional_rate * nb_nondirectional_channels;

+ /* Calculate rates for each channel */

+ for (i = 0; i < st->layout.nb_streams; i++)

{

- rate[i] = non_mono_rate;

+ if (i < st->layout.nb_coupled_streams)

+ {

+ rate[i] = nondirectional_rate * 2;

+ } else if (i == st->layout.nb_coupled_streams)

+ {

+ rate[i] = nondirectional_rate + leftover_bits;

+ } else

+ {

+ rate[i] = directional_rate;

+ }

}

#endif /* ENABLE_EXPERIMENTAL_AMBISONICS */

@@ -812,8 +882,8 @@ static opus_int32 rate_allocation(

return rate_sum;

}

-/* Max size in case the encoder decides to return three frames */

-#define MS_FRAME_TMP (3*1275+7)

+/* Max size in case the encoder decides to return six frames (6 x 20 ms = 120 ms) */

+#define MS_FRAME_TMP (6*1275+12)

static int opus_multistream_encode_native

(

OpusMSEncoder *st,

@@ -859,32 +929,8 @@ static int opus_multistream_encode_native

opus_encoder_ctl((OpusEncoder*)ptr, OPUS_GET_VBR(&vbr));

opus_encoder_ctl((OpusEncoder*)ptr, CELT_GET_MODE(&celt_mode));

- {

- opus_int32 delay_compensation;

- int channels;

- channels = st->layout.nb_streams + st->layout.nb_coupled_streams;

- opus_encoder_ctl((OpusEncoder*)ptr, OPUS_GET_LOOKAHEAD(&delay_compensation));

- delay_compensation -= Fs/400;

- frame_size = compute_frame_size(pcm, analysis_frame_size,

- st->variable_duration, channels, Fs, st->bitrate_bps,

- delay_compensation, downmix

-#ifndef DISABLE_FLOAT_API

- , st->subframe_mem

-#endif

- );

- }

- if (400*frame_size < Fs)

- {

- RESTORE_STACK;

- return OPUS_BAD_ARG;

- }

- /* Validate frame_size before using it to allocate stack space.

- This mirrors the checks in opus_encode[_float](). */

- if (400*frame_size != Fs && 200*frame_size != Fs &&

- 100*frame_size != Fs && 50*frame_size != Fs &&

- 25*frame_size != Fs && 50*frame_size != 3*Fs)

+ frame_size = frame_size_select(analysis_frame_size, st->variable_duration, Fs);

+ if (frame_size <= 0)

{

RESTORE_STACK;

return OPUS_BAD_ARG;

@@ -892,6 +938,9 @@ static int opus_multistream_encode_native

/* Smallest packet the encoder can produce. */

smallest_packet = st->layout.nb_streams*2-1;

+ /* 100 ms needs an extra byte per stream for the ToC. */

+ if (Fs/frame_size == 10)

+ smallest_packet += st->layout.nb_streams;

if (max_data_bytes < smallest_packet)

{

RESTORE_STACK;

@@ -1013,6 +1062,9 @@ static int opus_multistream_encode_native

curr_max = max_data_bytes - tot_size;

/* Reserve one byte for the last stream and two for the others */

curr_max -= IMAX(0,2*(st->layout.nb_streams-s-1)-1);

+ /* For 100 ms, reserve an extra byte per stream for the ToC */

+ if (Fs/frame_size == 10)

+ curr_max -= st->layout.nb_streams-s-1;

curr_max = IMIN(curr_max,MS_FRAME_TMP);

/* Repacketizer will add one or two bytes for self-delimited frames */

if (s != st->layout.nb_streams-1) curr_max -= curr_max>253 ? 2 : 1;

@@ -1161,9 +1213,11 @@ int opus_multistream_encoder_ctl(OpusMSEncoder *st, int request, ...)

case OPUS_SET_BITRATE_REQUEST:

{

opus_int32 value = va_arg(ap, opus_int32);

- if (value<0 && value!=OPUS_AUTO && value!=OPUS_BITRATE_MAX)

+ if (value != OPUS_AUTO && value != OPUS_BITRATE_MAX)

{

- goto bad_arg;

+ if (value <= 0)

+ goto bad_arg;

+ value = IMIN(300000*st->layout.nb_channels, IMAX(500*st->layout.nb_channels, value));

}

st->bitrate_bps = value;

}

@@ -1206,6 +1260,7 @@ int opus_multistream_encoder_ctl(OpusMSEncoder *st, int request, ...)

case OPUS_GET_INBAND_FEC_REQUEST:

case OPUS_GET_FORCE_CHANNELS_REQUEST:

case OPUS_GET_PREDICTION_DISABLED_REQUEST:

+ case OPUS_GET_PHASE_INVERSION_DISABLED_REQUEST:

{

OpusEncoder *enc;

/* For int32* GET params, just query the first stream */

@@ -1252,6 +1307,7 @@ int opus_multistream_encoder_ctl(OpusMSEncoder *st, int request, ...)

case OPUS_SET_FORCE_MODE_REQUEST:

case OPUS_SET_FORCE_CHANNELS_REQUEST:

case OPUS_SET_PREDICTION_DISABLED_REQUEST:

+ case OPUS_SET_PHASE_INVERSION_DISABLED_REQUEST:

{

int s;

/* This works for int32 params */

@@ -1313,7 +1369,6 @@ int opus_multistream_encoder_ctl(OpusMSEncoder *st, int request, ...)

case OPUS_RESET_STATE:

{

int s;

- st->subframe_mem[0] = st->subframe_mem[1] = st->subframe_mem[2] = 0;

if (st->mapping_type == MAPPING_TYPE_SURROUND)

{

OPUS_CLEAR(ms_get_preemph_mem(st), st->layout.nb_channels);

« no previous file with comments | « third_party/opus/src/src/opus_multistream_decoder.c ('k') | third_party/opus/src/src/opus_private.h » ('j') | no next file with comments »