Add long-term prediction to the ALS decoder.

Originally committed as revision 20534 to svn://svn.ffmpeg.org/ffmpeg/trunk
author: Thilo Borgmann <thilo.borgmann@googlemail.com> 2009-11-14 06:29:19 +0000
committer: Thilo Borgmann <thilo.borgmann@googlemail.com> 2009-11-14 06:29:19 +0000
commit: 93d38cf6b056b3cfd16fb86e65d6db2deeb34fb7 (patch)
tree: 772ab51e260850e986ac8b4f21f93473c75015eb
parent: 7934cbb3be7a03b1ae7a8a30613a7a75b1e28645 (diff)
download: ffmpeg-93d38cf6b056b3cfd16fb86e65d6db2deeb34fb7.tar.gz
2 files changed, 55 insertions, 2 deletions
diff --git a/libavcodec/als_data.h b/libavcodec/als_data.h
index 8c052cde53..bcde466064 100644
--- a/libavcodec/als_data.h
+++ b/libavcodec/als_data.h
@@ -92,4 +92,14 @@ static const int16_t parcor_scaled_values[] = {
 };
 
 
+/** Gain values of p(0) for long-term prediction.
+ *  To be indexed by the Rice coded indices.
+ */
+static const uint8_t ltp_gain_values [4][4] = {
+    { 0,  8, 16,  24},
+    {32, 40, 48,  56},
+    {64, 70, 76,  82},
+    {88, 92, 96, 100}
+};
+
 #endif /* AVCODEC_ALS_DATA_H */
diff --git a/libavcodec/alsdec.c b/libavcodec/alsdec.c
index ebb572dc31..a2f70aabaa 100644
--- a/libavcodec/alsdec.c
+++ b/libavcodec/alsdec.c
@@ -78,6 +78,7 @@ typedef struct {
     unsigned int frame_id;          ///< the frame ID / number of the current frame
     unsigned int js_switch;         ///< if true, joint-stereo decoding is enforced
     unsigned int num_blocks;        ///< number of blocks used in the current frame
+    int ltp_lag_length;             ///< number of bits used for ltp lag value
     int32_t *quant_cof;             ///< quantized parcor coefficients
     int32_t *lpc_cof;               ///< coefficients of the direct form prediction filter
     int32_t *prev_raw_samples;      ///< contains unshifted raw samples from the previous block
@@ -270,7 +271,6 @@ static int check_specific_config(ALSDecContext *ctx)
     }
 
     MISSING_ERR(sconf->floating,             "Floating point decoding",     -1);
-    MISSING_ERR(sconf->long_term_prediction, "Long-term prediction",        -1);
     MISSING_ERR(sconf->bgmc,                 "BGMC entropy decoding",       -1);
     MISSING_ERR(sconf->mc_coding,            "Multi-channel correlation",   -1);
     MISSING_ERR(sconf->rlslms,               "Adaptive RLS-LMS prediction", -1);
@@ -443,6 +443,9 @@ static int read_var_block(ALSDecContext *ctx, unsigned int ra_block,
     int          smp        = 0;
     int          sb, store_prev_samples;
     int64_t      y;
+    int          use_ltp    = 0;
+    int          ltp_lag    = 0;
+    int          ltp_gain[5];
 
     *js_blocks  = get_bits1(gb);
 
@@ -540,7 +543,23 @@ static int read_var_block(ALSDecContext *ctx, unsigned int ra_block,
         }
     }
 
-    // TODO: LTP mode
+    // read LTP gain and lag values
+    if (sconf->long_term_prediction) {
+        use_ltp = get_bits1(gb);
+
+        if (use_ltp) {
+            ltp_gain[0]   = decode_rice(gb, 1) << 3;
+            ltp_gain[1]   = decode_rice(gb, 2) << 3;
+
+            ltp_gain[2]   = ltp_gain_values[get_unary(gb, 0, 4)][get_bits(gb, 2)];
+
+            ltp_gain[3]   = decode_rice(gb, 2) << 3;
+            ltp_gain[4]   = decode_rice(gb, 1) << 3;
+
+            ltp_lag       = get_bits(gb, ctx->ltp_lag_length);
+            ltp_lag      += FFMAX(4, opt_order + 1);
+        }
+    }
 
     // read first value and residuals in case of a random access block
     if (ra_block) {
@@ -565,6 +584,26 @@ static int read_var_block(ALSDecContext *ctx, unsigned int ra_block,
                 *current_res++ = decode_rice(gb, s[sb]);
      }
 
+    // reverse long-term prediction
+    if (use_ltp) {
+        int ltp_smp;
+
+        for (ltp_smp = FFMAX(ltp_lag - 2, 0); ltp_smp < block_length; ltp_smp++) {
+            int center = ltp_smp - ltp_lag;
+            int begin  = FFMAX(0, center - 2);
+            int end    = center + 3;
+            int tab    = 5 - (end - begin);
+            int base;
+
+            y = 1 << 6;
+
+            for (base = begin; base < end; base++, tab++)
+                y += MUL64(ltp_gain[tab], raw_samples[base]);
+
+            raw_samples[ltp_smp] += y >> 7;
+        }
+    }
+
     // reconstruct all samples from residuals
     if (ra_block) {
         for (smp = 0; smp < opt_order; smp++) {
@@ -949,6 +988,10 @@ static av_cold int decode_init(AVCodecContext *avctx)
         avctx->bits_per_raw_sample = (sconf->resolution + 1) * 8;
     }
 
+    // set lag value for long-term prediction
+    ctx->ltp_lag_length = 8 + (avctx->sample_rate >=  96000) +
+                              (avctx->sample_rate >= 192000);
+
     avctx->frame_size = sconf->frame_length;
     channel_size      = sconf->frame_length + sconf->max_order;
author	Thilo Borgmann <thilo.borgmann@googlemail.com>	2009-11-14 06:29:19 +0000
committer	Thilo Borgmann <thilo.borgmann@googlemail.com>	2009-11-14 06:29:19 +0000
commit	93d38cf6b056b3cfd16fb86e65d6db2deeb34fb7 (patch)
tree	772ab51e260850e986ac8b4f21f93473c75015eb
parent	7934cbb3be7a03b1ae7a8a30613a7a75b1e28645 (diff)
download	ffmpeg-93d38cf6b056b3cfd16fb86e65d6db2deeb34fb7.tar.gz