diff mbox series

[FFmpeg-devel] opusdec: do not fail when LBRR frames are present

Message ID 20200911173714.23073-1-anton@khirnov.net
State Accepted
Headers show
Series [FFmpeg-devel] opusdec: do not fail when LBRR frames are present | expand

Checks

Context Check Description
andriy/default pending
andriy/make success Make finished
andriy/make_fate success Make fate finished

Commit Message

Anton Khirnov Sept. 11, 2020, 5:37 p.m. UTC
Decode and discard them.

Fixes ticket 4641.
---
 libavcodec/opus_silk.c | 28 ++++++++++++++++++++--------
 libavcodec/opustab.c   |  3 +++
 libavcodec/opustab.h   |  3 +++
 3 files changed, 26 insertions(+), 8 deletions(-)

Comments

Lynne Sept. 11, 2020, 6:53 p.m. UTC | #1
On 11/09/2020 19:37, Anton Khirnov wrote:
> Decode and discard them.
> 
> Fixes ticket 4641.
> ---
>  libavcodec/opus_silk.c | 28 ++++++++++++++++++++--------
>  libavcodec/opustab.c   |  3 +++
>  libavcodec/opustab.h   |  3 +++
>  3 files changed, 26 insertions(+), 8 deletions(-)
> 
> diff --git a/libavcodec/opus_silk.c b/libavcodec/opus_silk.c
> index 2fcbf3b9d3..c683b25a20 100644
> --- a/libavcodec/opus_silk.c
> +++ b/libavcodec/opus_silk.c
> @@ -506,7 +506,8 @@ static inline void silk_decode_excitation(SilkContext *s, OpusRangeCoder *rc,
>  #define LTP_ORDER 5
>  
>  static void silk_decode_frame(SilkContext *s, OpusRangeCoder *rc,
> -                              int frame_num, int channel, int coded_channels, int active, int active1)
> +                              int frame_num, int channel, int coded_channels,
> +                              int active, int active1, int redundant)
>  {
>      /* per frame */
>      int voiced;       // combines with active to indicate inactive, active, or active+voiced
> @@ -665,8 +666,8 @@ static void silk_decode_frame(SilkContext *s, OpusRangeCoder *rc,
>      silk_decode_excitation(s, rc, residual + SILK_MAX_LAG, qoffset_high,
>                             active, voiced);
>  
> -    /* skip synthesising the side channel if we want mono-only */
> -    if (s->output_channels == channel)
> +    /* skip synthesising the output if we do not need it */
> +    if (s->output_channels == channel || redundant)
>          return;

Maybe add a small TODO in the comment to actually implement error recovery?


>  
>      /* generate the output signal */
> @@ -814,15 +815,26 @@ int ff_silk_decode_superframe(SilkContext *s, OpusRangeCoder *rc,
>              active[i][j] = ff_opus_rc_dec_log(rc, 1);
>  
>          redundancy[i] = ff_opus_rc_dec_log(rc, 1);
> -        if (redundancy[i]) {
> -            avpriv_report_missing_feature(s->avctx, "LBRR frames");
> -            return AVERROR_PATCHWELCOME;
> -        }
>      }
>  
> +    /* read the per-frame LBRR flags */
> +    for (i = 0; i < coded_channels; i++)
> +        if (redundancy[i] && duration_ms > 20) {
> +            redundancy[i] = ff_opus_rc_dec_cdf(rc, duration_ms == 40 ?
> +                                                   ff_silk_model_lbrr_flags_40 : ff_silk_model_lbrr_flags_60);
> +        }
> +
> +    /* decode the LBRR frames */
> +    for (i = 0; i < nb_frames; i++)
> +        for (j = 0; j < coded_channels; j++)
> +            if (redundancy[j] & (1 << i)) {
> +                int active1 = (j == 0 && !(redundancy[1] & (1 << i))) ? 0 : 1;
> +                silk_decode_frame(s, rc, i, j, coded_channels, 1, active1, 1);
> +            }

nit: add brackets to the nb_frames loop

Apart from that LGTM.

It shouldn't be too difficult to implement proper error recovery in the
future, though it would have to be an optional setting, because a 1-frame
delay is still a 1-frame delay.
Derek Buitenhuis Sept. 13, 2020, 11:52 a.m. UTC | #2
On 11/09/2020 18:37, Anton Khirnov wrote:
> Decode and discard them.
> 
> Fixes ticket 4641.
> ---
>  libavcodec/opus_silk.c | 28 ++++++++++++++++++++--------
>  libavcodec/opustab.c   |  3 +++
>  libavcodec/opustab.h   |  3 +++
>  3 files changed, 26 insertions(+), 8 deletions(-)

I can confirm this also fixes the samples I have at $dayjob.

- Derek
Paul B Mahol Sept. 18, 2020, 8:31 a.m. UTC | #3
On Fri, Sep 11, 2020 at 07:37:14PM +0200, Anton Khirnov wrote:
> Decode and discard them.
> 
> Fixes ticket 4641.
> ---
>  libavcodec/opus_silk.c | 28 ++++++++++++++++++++--------
>  libavcodec/opustab.c   |  3 +++
>  libavcodec/opustab.h   |  3 +++
>  3 files changed, 26 insertions(+), 8 deletions(-)
> 

Looks fine.
Anton Khirnov Oct. 1, 2020, 9:18 a.m. UTC | #4
Quoting Lynne (2020-09-11 20:53:16)
> On 11/09/2020 19:37, Anton Khirnov wrote:
> > Decode and discard them.
> > 
> > Fixes ticket 4641.
> > ---
> >  libavcodec/opus_silk.c | 28 ++++++++++++++++++++--------
> >  libavcodec/opustab.c   |  3 +++
> >  libavcodec/opustab.h   |  3 +++
> >  3 files changed, 26 insertions(+), 8 deletions(-)
> > 
> > diff --git a/libavcodec/opus_silk.c b/libavcodec/opus_silk.c
> > index 2fcbf3b9d3..c683b25a20 100644
> > --- a/libavcodec/opus_silk.c
> > +++ b/libavcodec/opus_silk.c
> > @@ -506,7 +506,8 @@ static inline void silk_decode_excitation(SilkContext *s, OpusRangeCoder *rc,
> >  #define LTP_ORDER 5
> >  
> >  static void silk_decode_frame(SilkContext *s, OpusRangeCoder *rc,
> > -                              int frame_num, int channel, int coded_channels, int active, int active1)
> > +                              int frame_num, int channel, int coded_channels,
> > +                              int active, int active1, int redundant)
> >  {
> >      /* per frame */
> >      int voiced;       // combines with active to indicate inactive, active, or active+voiced
> > @@ -665,8 +666,8 @@ static void silk_decode_frame(SilkContext *s, OpusRangeCoder *rc,
> >      silk_decode_excitation(s, rc, residual + SILK_MAX_LAG, qoffset_high,
> >                             active, voiced);
> >  
> > -    /* skip synthesising the side channel if we want mono-only */
> > -    if (s->output_channels == channel)
> > +    /* skip synthesising the output if we do not need it */
> > +    if (s->output_channels == channel || redundant)
> >          return;
> 
> Maybe add a small TODO in the comment to actually implement error recovery?
> 
> 
> >  
> >      /* generate the output signal */
> > @@ -814,15 +815,26 @@ int ff_silk_decode_superframe(SilkContext *s, OpusRangeCoder *rc,
> >              active[i][j] = ff_opus_rc_dec_log(rc, 1);
> >  
> >          redundancy[i] = ff_opus_rc_dec_log(rc, 1);
> > -        if (redundancy[i]) {
> > -            avpriv_report_missing_feature(s->avctx, "LBRR frames");
> > -            return AVERROR_PATCHWELCOME;
> > -        }
> >      }
> >  
> > +    /* read the per-frame LBRR flags */
> > +    for (i = 0; i < coded_channels; i++)
> > +        if (redundancy[i] && duration_ms > 20) {
> > +            redundancy[i] = ff_opus_rc_dec_cdf(rc, duration_ms == 40 ?
> > +                                                   ff_silk_model_lbrr_flags_40 : ff_silk_model_lbrr_flags_60);
> > +        }
> > +
> > +    /* decode the LBRR frames */
> > +    for (i = 0; i < nb_frames; i++)
> > +        for (j = 0; j < coded_channels; j++)
> > +            if (redundancy[j] & (1 << i)) {
> > +                int active1 = (j == 0 && !(redundancy[1] & (1 << i))) ? 0 : 1;
> > +                silk_decode_frame(s, rc, i, j, coded_channels, 1, active1, 1);
> > +            }
> 
> nit: add brackets to the nb_frames loop
> 
> Apart from that LGTM.

Applied the review comments and pushed.
diff mbox series

Patch

diff --git a/libavcodec/opus_silk.c b/libavcodec/opus_silk.c
index 2fcbf3b9d3..c683b25a20 100644
--- a/libavcodec/opus_silk.c
+++ b/libavcodec/opus_silk.c
@@ -506,7 +506,8 @@  static inline void silk_decode_excitation(SilkContext *s, OpusRangeCoder *rc,
 #define LTP_ORDER 5
 
 static void silk_decode_frame(SilkContext *s, OpusRangeCoder *rc,
-                              int frame_num, int channel, int coded_channels, int active, int active1)
+                              int frame_num, int channel, int coded_channels,
+                              int active, int active1, int redundant)
 {
     /* per frame */
     int voiced;       // combines with active to indicate inactive, active, or active+voiced
@@ -665,8 +666,8 @@  static void silk_decode_frame(SilkContext *s, OpusRangeCoder *rc,
     silk_decode_excitation(s, rc, residual + SILK_MAX_LAG, qoffset_high,
                            active, voiced);
 
-    /* skip synthesising the side channel if we want mono-only */
-    if (s->output_channels == channel)
+    /* skip synthesising the output if we do not need it */
+    if (s->output_channels == channel || redundant)
         return;
 
     /* generate the output signal */
@@ -814,15 +815,26 @@  int ff_silk_decode_superframe(SilkContext *s, OpusRangeCoder *rc,
             active[i][j] = ff_opus_rc_dec_log(rc, 1);
 
         redundancy[i] = ff_opus_rc_dec_log(rc, 1);
-        if (redundancy[i]) {
-            avpriv_report_missing_feature(s->avctx, "LBRR frames");
-            return AVERROR_PATCHWELCOME;
-        }
     }
 
+    /* read the per-frame LBRR flags */
+    for (i = 0; i < coded_channels; i++)
+        if (redundancy[i] && duration_ms > 20) {
+            redundancy[i] = ff_opus_rc_dec_cdf(rc, duration_ms == 40 ?
+                                                   ff_silk_model_lbrr_flags_40 : ff_silk_model_lbrr_flags_60);
+        }
+
+    /* decode the LBRR frames */
+    for (i = 0; i < nb_frames; i++)
+        for (j = 0; j < coded_channels; j++)
+            if (redundancy[j] & (1 << i)) {
+                int active1 = (j == 0 && !(redundancy[1] & (1 << i))) ? 0 : 1;
+                silk_decode_frame(s, rc, i, j, coded_channels, 1, active1, 1);
+            }
+
     for (i = 0; i < nb_frames; i++) {
         for (j = 0; j < coded_channels && !s->midonly; j++)
-            silk_decode_frame(s, rc, i, j, coded_channels, active[j][i], active[1][i]);
+            silk_decode_frame(s, rc, i, j, coded_channels, active[j][i], active[1][i], 0);
 
         /* reset the side channel if it is not coded */
         if (s->midonly && s->frame[1].coded)
diff --git a/libavcodec/opustab.c b/libavcodec/opustab.c
index fb340e07e8..64070f8299 100644
--- a/libavcodec/opustab.c
+++ b/libavcodec/opustab.c
@@ -26,6 +26,9 @@  const uint8_t ff_opus_default_coupled_streams[] = { 0, 1, 1, 2, 2, 2, 2, 3 };
 
 const uint8_t ff_celt_band_end[] = { 13, 17, 17, 19, 21 };
 
+const uint16_t ff_silk_model_lbrr_flags_40[] = { 256, 0, 53, 106, 256 };
+const uint16_t ff_silk_model_lbrr_flags_60[] = { 256, 0, 41, 61, 90, 131, 146, 174, 256 };
+
 const uint16_t ff_silk_model_stereo_s1[] = {
     256,   7,   9,  10,  11,  12,  22,  46,  54,  55,  56,  59,  82, 174, 197, 200,
     201, 202, 210, 234, 244, 245, 246, 247, 249, 256
diff --git a/libavcodec/opustab.h b/libavcodec/opustab.h
index bce5a42830..892126bb23 100644
--- a/libavcodec/opustab.h
+++ b/libavcodec/opustab.h
@@ -31,6 +31,9 @@  extern const uint8_t  ff_celt_band_end[];
 
 extern const uint8_t  ff_opus_default_coupled_streams[];
 
+extern const uint16_t ff_silk_model_lbrr_flags_40[];
+extern const uint16_t ff_silk_model_lbrr_flags_60[];
+
 extern const uint16_t ff_silk_model_stereo_s1[];
 extern const uint16_t ff_silk_model_stereo_s2[];
 extern const uint16_t ff_silk_model_stereo_s3[];