aboutsummaryrefslogtreecommitdiffstats
diff options
context:
space:
mode:
author Thilo Borgmann <thilo.borgmann@googlemail.com> 2009-11-14 06:29:19 +0000
committer Thilo Borgmann <thilo.borgmann@googlemail.com> 2009-11-14 06:29:19 +0000
commit 93d38cf6b056b3cfd16fb86e65d6db2deeb34fb7 (patch)
tree 772ab51e260850e986ac8b4f21f93473c75015eb
parent 7934cbb3be7a03b1ae7a8a30613a7a75b1e28645 (diff)
download ffmpeg-93d38cf6b056b3cfd16fb86e65d6db2deeb34fb7.tar.gz
Add long-term prediction to the ALS decoder.
Originally committed as revision 20534 to svn://svn.ffmpeg.org/ffmpeg/trunk
-rw-r--r-- libavcodec/als_data.h 10
-rw-r--r-- libavcodec/alsdec.c 47
2 files changed, 55 insertions, 2 deletions
diff --git a/libavcodec/als_data.h b/libavcodec/als_data.h
index 8c052cde53..bcde466064 100644
--- a/libavcodec/als_data.h
+++ b/libavcodec/als_data.h
@@ -92,4 +92,14 @@ static const int16_t parcor_scaled_values[] = {
};
+/** Gain values of p(0) for long-term prediction.
+ * To be indexed by the Rice coded indices: the decoder in alsdec.c takes
+ * the row from get_unary(gb, 0, 4) and the column from get_bits(gb, 2),
+ * and stores the result in ltp_gain[2], the center one of the five taps.
+ * NOTE(review): the table has only 4 rows -- confirm that get_unary(gb, 0, 4)
+ * cannot return 4; otherwise the row index needs a bounds check.
+ */
+static const uint8_t ltp_gain_values [4][4] = {
+ { 0, 8, 16, 24},
+ {32, 40, 48, 56},
+ {64, 70, 76, 82},
+ {88, 92, 96, 100}
+};
+
#endif /* AVCODEC_ALS_DATA_H */
diff --git a/libavcodec/alsdec.c b/libavcodec/alsdec.c
index ebb572dc31..a2f70aabaa 100644
--- a/libavcodec/alsdec.c
+++ b/libavcodec/alsdec.c
@@ -78,6 +78,7 @@ typedef struct {
unsigned int frame_id; ///< the frame ID / number of the current frame
unsigned int js_switch; ///< if true, joint-stereo decoding is enforced
unsigned int num_blocks; ///< number of blocks used in the current frame
+ int ltp_lag_length; ///< number of bits used for ltp lag value
int32_t *quant_cof; ///< quantized parcor coefficients
int32_t *lpc_cof; ///< coefficients of the direct form prediction filter
int32_t *prev_raw_samples; ///< contains unshifted raw samples from the previous block
@@ -270,7 +271,6 @@ static int check_specific_config(ALSDecContext *ctx)
}
MISSING_ERR(sconf->floating, "Floating point decoding", -1);
- MISSING_ERR(sconf->long_term_prediction, "Long-term prediction", -1);
MISSING_ERR(sconf->bgmc, "BGMC entropy decoding", -1);
MISSING_ERR(sconf->mc_coding, "Multi-channel correlation", -1);
MISSING_ERR(sconf->rlslms, "Adaptive RLS-LMS prediction", -1);
@@ -443,6 +443,9 @@ static int read_var_block(ALSDecContext *ctx, unsigned int ra_block,
int smp = 0;
int sb, store_prev_samples;
int64_t y;
+ int use_ltp = 0;
+ int ltp_lag = 0;
+ int ltp_gain[5];
*js_blocks = get_bits1(gb);
@@ -540,7 +543,23 @@ static int read_var_block(ALSDecContext *ctx, unsigned int ra_block,
}
}
- // TODO: LTP mode
+ // read LTP gain and lag values
+ if (sconf->long_term_prediction) {
+ use_ltp = get_bits1(gb);
+
+ if (use_ltp) {
+ ltp_gain[0] = decode_rice(gb, 1) << 3;
+ ltp_gain[1] = decode_rice(gb, 2) << 3;
+
+ ltp_gain[2] = ltp_gain_values[get_unary(gb, 0, 4)][get_bits(gb, 2)];
+
+ ltp_gain[3] = decode_rice(gb, 2) << 3;
+ ltp_gain[4] = decode_rice(gb, 1) << 3;
+
+ ltp_lag = get_bits(gb, ctx->ltp_lag_length);
+ ltp_lag += FFMAX(4, opt_order + 1);
+ }
+ }
// read first value and residuals in case of a random access block
if (ra_block) {
@@ -565,6 +584,26 @@ static int read_var_block(ALSDecContext *ctx, unsigned int ra_block,
*current_res++ = decode_rice(gb, s[sb]);
}
+ // reverse long-term prediction
+ if (use_ltp) {
+ int ltp_smp;
+
+ for (ltp_smp = FFMAX(ltp_lag - 2, 0); ltp_smp < block_length; ltp_smp++) {
+ int center = ltp_smp - ltp_lag;
+ int begin = FFMAX(0, center - 2);
+ int end = center + 3;
+ int tab = 5 - (end - begin);
+ int base;
+
+ y = 1 << 6;
+
+ for (base = begin; base < end; base++, tab++)
+ y += MUL64(ltp_gain[tab], raw_samples[base]);
+
+ raw_samples[ltp_smp] += y >> 7;
+ }
+ }
+
// reconstruct all samples from residuals
if (ra_block) {
for (smp = 0; smp < opt_order; smp++) {
@@ -949,6 +988,10 @@ static av_cold int decode_init(AVCodecContext *avctx)
avctx->bits_per_raw_sample = (sconf->resolution + 1) * 8;
}
+ // set lag value for long-term prediction
+ ctx->ltp_lag_length = 8 + (avctx->sample_rate >= 96000) +
+ (avctx->sample_rate >= 192000);
+
avctx->frame_size = sconf->frame_length;
channel_size = sconf->frame_length + sconf->max_order;