Fix bandwith vs. bandwiDth typo.

[frescor/ffmpeg.git] / libavcodec / qcelpdec.c
diff --git a/libavcodec/qcelpdec.c b/libavcodec/qcelpdec.c

index 740fd3458155be2f19d8f577f3a20ef2939f7459..bf2381503a0a3f54f4f1ceef0c43d85282e9d247 100644 (file)
--- a/libavcodec/qcelpdec.c
+++ b/libavcodec/qcelpdec.c
@@ -20,21 +20,24 @@
   */
  
  /**
- * @file qcelpdec.c
+ * @file libavcodec/qcelpdec.c
   * QCELP decoder
   * @author Reynaldo H. Verdejo Pinochet
   * @remark FFmpeg merging spearheaded by Kenan Gillet
+ * @remark Development mentored by Benjamin Larson
   */
  
  #include <stddef.h>
  
  #include "avcodec.h"
-#include "bitstream.h"
+#include "internal.h"
+#include "get_bits.h"
  
  #include "qcelpdata.h"
  
  #include "celp_math.h"
  #include "celp_filters.h"
+#include "acelp_vectors.h"
  
  #undef NDEBUG
  #include <assert.h>
@@ -58,7 +61,7 @@ typedef struct
      uint8_t  erasure_count;
      uint8_t  octave_count;      /*!< count the consecutive RATE_OCTAVE frames */
      float    prev_lspf[10];
-    float    predictor_lspf[10];/*!< LSP predictor, only use for RATE_OCTAVE and I_F_Q */
+    float    predictor_lspf[10];/*!< LSP predictor for RATE_OCTAVE and I_F_Q */
      float    pitch_synthesis_filter_mem[303];
      float    pitch_pre_filter_mem[303];
      float    rnd_fir_filter_mem[180];
@@ -69,6 +72,7 @@ typedef struct
      float    pitch_gain[4];
      uint8_t  pitch_lag[4];
      uint16_t first16bits;
+    uint8_t  warned_buf_mismatch_bitrate;
  } QCELPContext;
  
  /**
@@ -76,18 +80,7 @@ typedef struct
   *
   * TIA/EIA/IS-733 2.4.3.3.5
   */
-void ff_qcelp_lspf2lpc(const float *lspf, float *lpc);
-
-static void weighted_vector_sumf(float *out, const float *in_a,
-                                 const float *in_b, float weight_coeff_a,
-                                 float weight_coeff_b, int length)
-{
-    int i;
-
-    for(i=0; i<length; i++)
-        out[i] = weight_coeff_a * in_a[i]
-               + weight_coeff_b * in_b[i];
-}
+void ff_celp_lspf2lpc(const double *lspf, float *lpc);
  
  /**
   * Initialize the speech codec according to the specification.
@@ -171,7 +164,7 @@ static int decode_lspf(QCELPContext *q, float *lspf)
              lspf[i-1] = FFMIN(lspf[i-1], (lspf[i] - QCELP_LSP_SPREAD_FACTOR));
  
          // Low-pass filter the LSP frequencies.
-        weighted_vector_sumf(lspf, lspf, q->prev_lspf, smooth, 1.0-smooth, 10);
+        ff_weighted_vector_sumf(lspf, lspf, q->prev_lspf, smooth, 1.0-smooth, 10);
      }else
      {
          q->octave_count = 0;
@@ -256,7 +249,7 @@ static void decode_gain_and_index(QCELPContext  *q,
              gain[2] =     gain[1];
              gain[1] = 0.6*gain[0] + 0.4*gain[1];
          }
-    }else
+    }else if (q->bitrate != SILENCE)
      {
          if(q->bitrate == RATE_OCTAVE)
          {
@@ -336,7 +329,7 @@ static int codebook_sanity_check_for_rate_quarter(const uint8_t *cbgain)
   * @param gain array holding the 4 pitch subframe gain values
   * @param cdn_vector array for the generated scaled codebook vector
   */
-static void compute_svector(const QCELPContext *q, const float *gain,
+static void compute_svector(QCELPContext *q, const float *gain,
                              float *cdn_vector)
  {
      int      i, j, k;
@@ -412,22 +405,46 @@ static void compute_svector(const QCELPContext *q, const float *gain,
                      *cdn_vector++ = tmp_gain * qcelp_rate_full_codebook[cbseed++ & 127];
              }
          break;
+        case SILENCE:
+            memset(cdn_vector, 0, 160 * sizeof(float));
+        break;
      }
  }
  
  /**
- * Apply generic gain control.
+ * Compute the gain control
   *
- * @param v_out output vector
   * @param v_in gain-controlled vector
   * @param v_ref vector to control gain of
   *
+ * @return gain control
+ *
   * FIXME: If v_ref is a zero vector, its energy is zero
   *        and the behavior of the gain control is
   *        undefined in the specs.
   *
   * TIA/EIA/IS-733 2.4.8.3-2/3/4/5, 2.4.8.6
   */
+static float compute_gain_ctrl(const float *v_ref, const float *v_in, const int len)
+{ /* returns sqrt(dot(v_ref,v_ref) / dot(v_in,v_in)), or 0 when dot(v_in,v_in) is 0 */
+    float scalefactor = ff_dot_productf(v_in, v_in, len); /* v_in dotted with itself over len samples; presumably its energy -- confirm against ff_dot_productf */
+
+    if(scalefactor) /* this value is the divisor below, so skip the division when it is zero */
+        scalefactor = sqrt(ff_dot_productf(v_ref, v_ref, len) / scalefactor);
+    else
+        ff_log_missing_feature(NULL, "Zero energy for gain control", 1); /* scalefactor stays 0 and is returned as-is */
+    return scalefactor;
+}
+
+/**
+ * Apply generic gain control.
+ *
+ * @param v_out output vector
+ * @param v_in gain-controlled vector
+ * @param v_ref vector to control gain of
+ *
+ * TIA/EIA/IS-733 2.4.8.3, 2.4.8.6
+ */
  static void apply_gain_ctrl(float *v_out, const float *v_ref,
                              const float *v_in)
  {
@@ -436,12 +453,7 @@ static void apply_gain_ctrl(float *v_out, const float *v_ref,
  
      for(i=0, j=0; i<4; i++)
      {
-        scalefactor = ff_dot_productf(v_in + j, v_in + j, 40);
-        if(scalefactor)
-            scalefactor = sqrt(ff_dot_productf(v_ref + j, v_ref + j, 40)
-                        / scalefactor);
-        else
-            av_log_missing_feature(NULL, "Zero energy for gain control", 1);
+        scalefactor = compute_gain_ctrl(v_ref + j, v_in + j, 40);
          for(len=j+40; j<len; j++)
              v_out[j] = scalefactor * v_in[j];
      }
@@ -507,7 +519,7 @@ static const float *do_pitchfilter(float memory[303], const float v_in[160],
  
  /**
   * Apply pitch synthesis filter and pitch prefilter to the scaled codebook vector.
- * TIA/EIA/IS-733 2.4.5.2
+ * TIA/EIA/IS-733 2.4.5.2, 2.4.8.7.2
   *
   * @param q the context
   * @param cdn_vector the scaled codebook vector
@@ -518,6 +530,7 @@ static void apply_pitch_filters(QCELPContext *q, float *cdn_vector)
      const float *v_synthesis_filtered, *v_pre_filtered;
  
      if(q->bitrate >= RATE_HALF ||
+       q->bitrate == SILENCE ||
         (q->bitrate == I_F_Q && (q->prev_bitrate >= RATE_HALF)))
      {
  
@@ -533,7 +546,19 @@ static void apply_pitch_filters(QCELPContext *q, float *cdn_vector)
              }
          }else
          {
-            float max_pitch_gain = q->erasure_count < 3 ? 0.9 - 0.3 * (q->erasure_count - 1) : 0.0;
+            float max_pitch_gain;
+
+            if (q->bitrate == I_F_Q)
+            {
+                  if (q->erasure_count < 3)
+                      max_pitch_gain = 0.9 - 0.3 * (q->erasure_count - 1);
+                  else
+                      max_pitch_gain = 0.0;
+            }else
+            {
+                assert(q->bitrate == SILENCE);
+                max_pitch_gain = 1.0;
+            }
              for(i=0; i<4; i++)
                  q->pitch_gain[i] = FFMIN(q->pitch_gain[i], max_pitch_gain);
  
@@ -565,11 +590,41 @@ static void apply_pitch_filters(QCELPContext *q, float *cdn_vector)
      }
  }
  
+/**
+ * Reconstructs LPC coefficients from the line spectral pair frequencies
+ * and performs bandwidth expansion.
+ *
+ * @param lspf line spectral pair frequencies
+ * @param lpc linear predictive coding coefficients
+ *
+ * @note: bandwidth_expansion_coeff could be precalculated into a table
+ *        but it seems to be slower on x86
+ *
+ * TIA/EIA/IS-733 2.4.3.3.5
+ */
+static void lspf2lpc(const float *lspf, float *lpc)
+{ /* converts lspf[0..9] through ff_celp_lspf2lpc(), then scales lpc[0..9] in place */
+    double lsf[10]; /* holds cos(M_PI * lspf[i]) for each of the 10 inputs */
+    double bandwidth_expansion_coeff = QCELP_BANDWIDTH_EXPANSION_COEFF; /* running power of the constant, starting at the first power */
+    int   i;
+
+    for (i=0; i<10; i++)
+        lsf[i] = cos(M_PI * lspf[i]); /* stored as double, the element type ff_celp_lspf2lpc() takes */
+
+    ff_celp_lspf2lpc(lsf, lpc);
+
+    for (i=0; i<10; i++)
+    {
+        lpc[i] *= bandwidth_expansion_coeff; /* lpc[i] is scaled by the constant raised to the power i+1 */
+        bandwidth_expansion_coeff *= QCELP_BANDWIDTH_EXPANSION_COEFF; /* advance to the next power for the next coefficient */
+    }
+}
+
  /**
   * Interpolates LSP frequencies and computes LPC coefficients
   * for a given bitrate & pitch subframe.
   *
- * TIA/EIA/IS-733 2.4.3.3.4
+ * TIA/EIA/IS-733 2.4.3.3.4, 2.4.8.7.2
   *
   * @param q the context
   * @param curr_lspf LSP frequencies vector of the current frame
@@ -591,15 +646,17 @@ void interpolate_lpc(QCELPContext *q, const float *curr_lspf, float *lpc,
  
      if(weight != 1.0)
      {
-        weighted_vector_sumf(interpolated_lspf, curr_lspf, q->prev_lspf,
-                             weight, 1.0 - weight, 10);
-        ff_qcelp_lspf2lpc(interpolated_lspf, lpc);
+        ff_weighted_vector_sumf(interpolated_lspf, curr_lspf, q->prev_lspf,
+                                weight, 1.0 - weight, 10);
+        lspf2lpc(interpolated_lspf, lpc);
      }else if(q->bitrate >= RATE_QUARTER ||
               (q->bitrate == I_F_Q && !subframe_num))
-        ff_qcelp_lspf2lpc(curr_lspf, lpc);
+        lspf2lpc(curr_lspf, lpc);
+    else if(q->bitrate == SILENCE && !subframe_num)
+        lspf2lpc(q->prev_lspf, lpc);
  }
  
-static int buf_size2bitrate(const int buf_size)
+static qcelp_packet_rate buf_size2bitrate(const int buf_size)
  {
      switch(buf_size)
      {
@@ -610,7 +667,7 @@ static int buf_size2bitrate(const int buf_size)
          case  1: return SILENCE;
      }
  
-    return -1;
+    return I_F_Q;
  }
  
  /**
@@ -625,8 +682,8 @@ static int buf_size2bitrate(const int buf_size)
   *
   * TIA/EIA/IS-733 2.4.8.7.1
   */
-static int determine_bitrate(AVCodecContext *avctx, const int buf_size,
-                             uint8_t **buf)
+static qcelp_packet_rate determine_bitrate(AVCodecContext *avctx, const int buf_size,
+                             const uint8_t **buf)
  {
      qcelp_packet_rate bitrate;
  
@@ -634,8 +691,13 @@ static int determine_bitrate(AVCodecContext *avctx, const int buf_size,
      {
          if(bitrate > **buf)
          {
+            QCELPContext *q = avctx->priv_data;
+            if (!q->warned_buf_mismatch_bitrate)
+            {
              av_log(avctx, AV_LOG_WARNING,
                     "Claimed bitrate and buffer size mismatch.\n");
+                q->warned_buf_mismatch_bitrate = 1;
+            }
              bitrate = **buf;
          }else if(bitrate < **buf)
          {
@@ -653,9 +715,8 @@ static int determine_bitrate(AVCodecContext *avctx, const int buf_size,
  
      if(bitrate == SILENCE)
      {
-        // FIXME: the decoder should not handle SILENCE frames as I_F_Q frames
-        av_log_missing_feature(avctx, "Blank frame", 1);
-        bitrate = I_F_Q;
+        //FIXME: Remove experimental warning when tested with samples.
+        ff_log_ask_for_sample(avctx, "'Blank frame handling is experimental.");
      }
      return bitrate;
  }
@@ -668,8 +729,10 @@ static void warn_insufficient_frame_quality(AVCodecContext *avctx,
  }
  
  static int qcelp_decode_frame(AVCodecContext *avctx, void *data, int *data_size,
-                              uint8_t *buf, const int buf_size)
+                              AVPacket *avpkt)
  {
+    const uint8_t *buf = avpkt->data;
+    int buf_size = avpkt->size;
      QCELPContext *q = avctx->priv_data;
      float *outbuffer = data;
      int   i;