FFmpeg
|
AMR narrowband decoder. More...
#include <string.h>
#include <math.h>
#include "libavutil/channel_layout.h"
#include "avcodec.h"
#include "dsputil.h"
#include "libavutil/common.h"
#include "libavutil/avassert.h"
#include "celp_math.h"
#include "celp_filters.h"
#include "acelp_filters.h"
#include "acelp_vectors.h"
#include "acelp_pitch_delay.h"
#include "lsp.h"
#include "amr.h"
#include "internal.h"
#include "amrnbdata.h"
Go to the source code of this file.
Data Structures | |
struct | AMRContext |
Macros | |
#define | AMR_BLOCK_SIZE 160 |
samples per frame | |
#define | AMR_SAMPLE_BOUND 32768.0 |
threshold for synthesis overflow | |
#define | AMR_SAMPLE_SCALE (2.0 / 32768.0) |
Scale from constructed speech to [-1,1]. | |
#define | PRED_FAC_MODE_12k2 0.65 |
Prediction factor for 12.2kbit/s mode. | |
#define | LSF_R_FAC (8000.0 / 32768.0) |
LSF residual tables to Hertz. | |
#define | MIN_LSF_SPACING (50.0488 / 8000.0) |
Ensures stability of LPC filter. | |
#define | PITCH_LAG_MIN_MODE_12k2 18 |
Lower bound on decoded lag search in 12.2kbit/s mode. | |
#define | MIN_ENERGY -14.0 |
Initial energy in dB. | |
#define | SHARP_MAX 0.79449462890625 |
Maximum sharpening factor. | |
#define | AMR_TILT_RESPONSE 22 |
Number of impulse response coefficients used for tilt factor. | |
#define | AMR_TILT_GAMMA_T 0.8 |
Tilt factor = 1st reflection coefficient * gamma_t. | |
#define | AMR_AGC_ALPHA 0.9 |
Adaptive gain control factor used in post-filter. | |
Functions | |
static void | weighted_vector_sumd (double *out, const double *in_a, const double *in_b, double weight_coeff_a, double weight_coeff_b, int length) |
Double version of ff_weighted_vector_sumf() | |
static av_cold int | amrnb_decode_init (AVCodecContext *avctx) |
static enum Mode | unpack_bitstream (AMRContext *p, const uint8_t *buf, int buf_size) |
Unpack an RFC4867 speech frame into the AMR frame mode and parameters. | |
static int | amrnb_decode_frame (AVCodecContext *avctx, void *data, int *got_frame_ptr, AVPacket *avpkt) |
AMR pitch LPC coefficient decoding functions | |
static void | interpolate_lsf (ACELPVContext *ctx, float lsf_q[4][LP_FILTER_ORDER], float *lsf_new) |
Interpolate the LSF vector (used for fixed gain smoothing). | |
static void | lsf2lsp_for_mode12k2 (AMRContext *p, double lsp[LP_FILTER_ORDER], const float lsf_no_r[LP_FILTER_ORDER], const int16_t *lsf_quantizer[5], const int quantizer_offset, const int sign, const int update) |
Decode a set of 5 split-matrix quantized lsf indexes into an lsp vector. | |
static void | lsf2lsp_5 (AMRContext *p) |
Decode a set of 5 split-matrix quantized lsf indexes into 2 lsp vectors. | |
static void | lsf2lsp_3 (AMRContext *p) |
Decode a set of 3 split-matrix quantized lsf indexes into an lsp vector. | |
AMR pitch vector decoding functions | |
static void | decode_pitch_lag_1_6 (int *lag_int, int *lag_frac, int pitch_index, const int prev_lag_int, const int subframe) |
Like ff_decode_pitch_lag(), but with 1/6 resolution. | |
static void | decode_pitch_vector (AMRContext *p, const AMRNBSubframe *amr_subframe, const int subframe) |
AMR algebraic code book (fixed) vector decoding functions | |
static void | decode_10bit_pulse (int code, int pulse_position[8], int i1, int i2, int i3) |
Decode a 10-bit algebraic codebook index from a 10.2 kbit/s frame. | |
static void | decode_8_pulses_31bits (const int16_t *fixed_index, AMRFixed *fixed_sparse) |
Decode the algebraic codebook index to pulse positions and signs and construct the algebraic codebook vector for MODE_10k2. | |
static void | decode_fixed_sparse (AMRFixed *fixed_sparse, const uint16_t *pulses, const enum Mode mode, const int subframe) |
Decode the algebraic codebook index to pulse positions and signs, then construct the algebraic codebook vector. | |
static void | pitch_sharpening (AMRContext *p, int subframe, enum Mode mode, AMRFixed *fixed_sparse) |
Apply pitch lag to obtain the sharpened fixed vector (section 6.1.2) | |
AMR gain decoding functions | |
static float | fixed_gain_smooth (AMRContext *p, const float *lsf, const float *lsf_avg, const enum Mode mode) |
fixed gain smoothing Note that where the spec specifies the "spectrum in the q domain" in section 6.1.4, in fact frequencies should be used. | |
static void | decode_gains (AMRContext *p, const AMRNBSubframe *amr_subframe, const enum Mode mode, const int subframe, float *fixed_gain_factor) |
Decode pitch gain and fixed gain factor (part of section 6.1.3). | |
AMR preprocessing functions | |
static void | apply_ir_filter (float *out, const AMRFixed *in, const float *filter) |
Circularly convolve a sparse fixed vector with a phase dispersion impulse response filter (D.6.2 of G.729 and 6.1.5 of AMR). | |
static const float * | anti_sparseness (AMRContext *p, AMRFixed *fixed_sparse, const float *fixed_vector, float fixed_gain, float *out) |
Reduce fixed vector sparseness by smoothing with one of three IR filters. | |
AMR synthesis functions | |
static int | synthesis (AMRContext *p, float *lpc, float fixed_gain, const float *fixed_vector, float *samples, uint8_t overflow) |
Conduct 10th order linear predictive coding synthesis. | |
AMR update functions | |
static void | update_state (AMRContext *p) |
Update buffers and history at the end of decoding a subframe. | |
AMR Postprocessing functions | |
static float | tilt_factor (AMRContext *p, float *lpc_n, float *lpc_d) |
Get the tilt factor of a formant filter from its transfer function. | |
static void | postfilter (AMRContext *p, float *lpc, float *buf_out) |
Perform adaptive post-filtering to enhance the quality of the speech. | |
Variables | |
AVCodec | ff_amrnb_decoder |
AMR narrowband decoder.
This decoder uses floats for simplicity and so is not bit-exact. One difference is that differences in phase can accumulate. The test sequences in 3GPP TS 26.074 can still be useful.
Definition in file amrnbdec.c.
#define AMR_BLOCK_SIZE 160 |
#define AMR_SAMPLE_BOUND 32768.0 |
threshold for synthesis overflow
Definition at line 63 of file amrnbdec.c.
Referenced by synthesis().
#define AMR_SAMPLE_SCALE (2.0 / 32768.0) |
Scale from constructed speech to [-1,1].
AMR is designed to produce 16-bit PCM samples (3GPP TS 26.090 4.2) but upscales by two (section 6.2.2).
Fundamentally, this scale is determined by energy_mean through the fixed vector contribution to the excitation vector.
Definition at line 74 of file amrnbdec.c.
Referenced by amrnb_decode_frame().
#define PRED_FAC_MODE_12k2 0.65 |
Prediction factor for 12.2kbit/s mode.
Definition at line 77 of file amrnbdec.c.
Referenced by lsf2lsp_5().
#define LSF_R_FAC (8000.0 / 32768.0) |
LSF residual tables to Hertz.
Definition at line 79 of file amrnbdec.c.
Referenced by lsf2lsp_3(), lsf2lsp_5(), and lsf2lsp_for_mode12k2().
#define MIN_LSF_SPACING (50.0488 / 8000.0) |
Ensures stability of LPC filter.
Definition at line 80 of file amrnbdec.c.
Referenced by lsf2lsp_3(), and lsf2lsp_for_mode12k2().
#define PITCH_LAG_MIN_MODE_12k2 18 |
Lower bound on decoded lag search in 12.2kbit/s mode.
Definition at line 81 of file amrnbdec.c.
Referenced by decode_pitch_lag_1_6().
#define MIN_ENERGY -14.0 |
Initial energy in dB.
Also used for bad frames (unimplemented).
Definition at line 84 of file amrnbdec.c.
Referenced by amrnb_decode_init(), and amrwb_decode_init().
#define SHARP_MAX 0.79449462890625 |
Maximum sharpening factor.
The specification says 0.8, which should be 13107, but the reference C code uses 13017 instead. (Amusingly the same applies to SHARP_MAX in g729dec.c.)
Definition at line 91 of file amrnbdec.c.
Referenced by pitch_sharpening(), and synthesis().
#define AMR_TILT_RESPONSE 22 |
Number of impulse response coefficients used for tilt factor.
Definition at line 94 of file amrnbdec.c.
Referenced by tilt_factor().
#define AMR_TILT_GAMMA_T 0.8 |
Tilt factor = 1st reflection coefficient * gamma_t.
Definition at line 96 of file amrnbdec.c.
Referenced by tilt_factor().
#define AMR_AGC_ALPHA 0.9 |
Adaptive gain control factor used in post-filter.
Definition at line 98 of file amrnbdec.c.
Referenced by postfilter().
|
static |
Double version of ff_weighted_vector_sumf()
Definition at line 150 of file amrnbdec.c.
Referenced by lsf2lsp_5().
|
static |
Definition at line 161 of file amrnbdec.c.
|
static |
Unpack an RFC4867 speech frame into the AMR frame mode and parameters.
The order of speech bits is specified by 3GPP TS 26.101.
p | the context |
buf | pointer to the input buffer |
buf_size | size of the input buffer |
Definition at line 211 of file amrnbdec.c.
Referenced by amrnb_decode_frame().
|
static |
Interpolate the LSF vector (used for fixed gain smoothing).
The interpolation is done over all four subframes even in MODE_12k2.
[in] | ctx | The Context |
[in,out] | lsf_q | LSFs in [0,1] for each subframe |
[in] | lsf_new | New LSFs in [0,1] for subframe 4 |
Definition at line 243 of file amrnbdec.c.
Referenced by lsf2lsp_3(), and lsf2lsp_for_mode12k2().
|
static |
Decode a set of 5 split-matrix quantized lsf indexes into an lsp vector.
p | the context |
lsp | output LSP vector |
lsf_no_r | LSF vector without the residual vector added |
lsf_quantizer | pointers to LSF dictionary tables |
quantizer_offset | offset in tables |
sign | for the 3 dictionary table |
update | store data for computing the next frame's LSFs |
Definition at line 264 of file amrnbdec.c.
Referenced by lsf2lsp_5().
|
static |
Decode a set of 5 split-matrix quantized lsf indexes into 2 lsp vectors.
p | pointer to the AMRContext |
Definition at line 302 of file amrnbdec.c.
Referenced by amrnb_decode_frame().
|
static |
Decode a set of 3 split-matrix quantized lsf indexes into an lsp vector.
p | pointer to the AMRContext |
Definition at line 331 of file amrnbdec.c.
Referenced by amrnb_decode_frame().
|
static |
Like ff_decode_pitch_lag(), but with 1/6 resolution.
Definition at line 376 of file amrnbdec.c.
Referenced by decode_pitch_vector().
|
static |
Definition at line 395 of file amrnbdec.c.
Referenced by amrnb_decode_frame().
|
static |
Decode a 10-bit algebraic codebook index from a 10.2 kbit/s frame.
Definition at line 439 of file amrnbdec.c.
Referenced by decode_8_pulses_31bits().
Decode the algebraic codebook index to pulse positions and signs and construct the algebraic codebook vector for MODE_10k2.
fixed_index | positions of the eight pulses |
fixed_sparse | pointer to the algebraic codebook vector |
Definition at line 457 of file amrnbdec.c.
Referenced by decode_fixed_sparse().
|
static |
Decode the algebraic codebook index to pulse positions and signs, then construct the algebraic codebook vector.
nb of pulses | bits encoding pulses
For MODE_4k75 or MODE_5k15, 2 | 1-3, 4-6, 7 MODE_5k9, 2 | 1, 2-4, 5-6, 7-9 MODE_6k7, 3 | 1-3, 4, 5-7, 8, 9-11 MODE_7k4 or MODE_7k95, 4 | 1-3, 4-6, 7-9, 10, 11-13
fixed_sparse | pointer to the algebraic codebook vector |
pulses | algebraic codebook indexes |
mode | mode of the current frame |
subframe | current subframe number |
Definition at line 503 of file amrnbdec.c.
Referenced by amrnb_decode_frame().
|
static |
Apply pitch lag to obtain the sharpened fixed vector (section 6.1.2)
p | the context |
subframe | unpacked amr subframe |
mode | mode of the current frame |
fixed_sparse | sparse respresentation of the fixed vector |
Definition at line 556 of file amrnbdec.c.
Referenced by amrnb_decode_frame().
|
static |
fixed gain smoothing Note that where the spec specifies the "spectrum in the q domain" in section 6.1.4, in fact frequencies should be used.
p | the context |
lsf | LSFs for the current subframe, in the range [0,1] |
lsf_avg | averaged LSFs |
mode | mode of the current frame |
Definition at line 592 of file amrnbdec.c.
Referenced by amrnb_decode_frame().
|
static |
Decode pitch gain and fixed gain factor (part of section 6.1.3).
p | the context |
amr_subframe | unpacked amr subframe |
mode | mode of the current frame |
subframe | current subframe number |
fixed_gain_factor | decoded gain correction factor |
Definition at line 634 of file amrnbdec.c.
Referenced by amrnb_decode_frame().
Circularly convolve a sparse fixed vector with a phase dispersion impulse response filter (D.6.2 of G.729 and 6.1.5 of AMR).
out | vector with filter applied |
in | source vector |
filter | phase filter coefficients |
out[n] = sum(i,0,len-1){ in[i] * filter[(len + n - i)len] }
< filters at pitch lag*1 and *2
Definition at line 676 of file amrnbdec.c.
Referenced by anti_sparseness().
|
static |
Reduce fixed vector sparseness by smoothing with one of three IR filters.
Also know as "adaptive phase dispersion".
This implements 3GPP TS 26.090 section 6.1(5).
p | the context |
fixed_sparse | algebraic codebook vector |
fixed_vector | unfiltered fixed vector |
fixed_gain | smoothed gain |
out | space for modified vector if necessary |
Definition at line 723 of file amrnbdec.c.
Referenced by amrnb_decode_frame().
|
static |
Conduct 10th order linear predictive coding synthesis.
p | pointer to the AMRContext |
lpc | pointer to the LPC coefficients |
fixed_gain | fixed codebook gain for synthesis |
fixed_vector | algebraic codebook vector |
samples | pointer to the output speech samples |
overflow | 16-bit overflow flag |
Definition at line 794 of file amrnbdec.c.
Referenced by amrnb_decode_frame().
|
static |
Update buffers and history at the end of decoding a subframe.
p | pointer to the AMRContext |
Definition at line 851 of file amrnbdec.c.
Referenced by amrnb_decode_frame().
|
static |
Get the tilt factor of a formant filter from its transfer function.
p | The Context |
lpc_n | LP_FILTER_ORDER coefficients of the numerator |
lpc_d | LP_FILTER_ORDER coefficients of the denominator |
Definition at line 878 of file amrnbdec.c.
Referenced by postfilter().
|
static |
Perform adaptive post-filtering to enhance the quality of the speech.
See section 6.2.1.
p | pointer to the AMRContext |
lpc | interpolated LP coefficients for this subframe |
buf_out | output of the filter |
Definition at line 908 of file amrnbdec.c.
Referenced by amrnb_decode_frame().
|
static |
Definition at line 952 of file amrnbdec.c.
AVCodec ff_amrnb_decoder |
Definition at line 1089 of file amrnbdec.c.