/* libavcodec/g723_1.h - manifest_repos/ffmpeg - Git at Google */

 /*
  * G.723.1 common header and data tables
  * Copyright (c) 2006 Benjamin Larsson
  * Copyright (c) 2010 Mohamed Naufal Basheer
  *
  * This file is part of FFmpeg.
  *
  * FFmpeg is free software; you can redistribute it and/or
  * modify it under the terms of the GNU Lesser General Public
  * License as published by the Free Software Foundation; either
  * version 2.1 of the License, or (at your option) any later version.
  *
  * FFmpeg is distributed in the hope that it will be useful,
  * but WITHOUT ANY WARRANTY; without even the implied warranty of
  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
  * Lesser General Public License for more details.
  *
  * You should have received a copy of the GNU Lesser General Public
  * License along with FFmpeg; if not, write to the Free Software
  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  */

 /**
  * @file
  * G.723.1 types, functions and data tables
  */

 #ifndef AVCODEC_G723_1_H
 #define AVCODEC_G723_1_H

 #include <stdint.h>

 #include "libavutil/log.h"

 /* Frame layout: a frame is SUBFRAMES subframes of SUBFRAME_LEN each. */
 #define SUBFRAMES       4                               /* subframes per frame */
 #define SUBFRAME_LEN    60                              /* length of one subframe */
 #define FRAME_LEN       (SUBFRAMES * SUBFRAME_LEN)      /* 240 */
 #define HALF_FRAME_LEN  (FRAME_LEN >> 1)                /* 120 */
 #define LPC_FRAME       (SUBFRAME_LEN + HALF_FRAME_LEN) /* 180 */

 /* LPC / LSP dimensions. */
 #define LPC_ORDER       10                              /* length of every LPC/LSP vector here */
 #define LSP_BANDS       3                               /* matches lsp_band0..lsp_band2 */
 #define LSP_CB_SIZE     256                             /* rows in each LSP VQ table */

 /* Pitch-related sizes. */
 #define PITCH_MIN       18
 #define PITCH_MAX       (127 + PITCH_MIN)               /* 145 */
 #define PITCH_ORDER     5

 /* Fixed codebook and table sizes. */
 #define GRID_SIZE       2
 #define PULSE_MAX       6                               /* size of the per-pulse arrays */
 #define GAIN_LEVELS     24                              /* entries in ff_g723_1_fixed_cb_gain */
 #define COS_TBL_SIZE    512                             /* cosine table holds COS_TBL_SIZE + 1 */

 /**
  * Bit-exact fixed-point product: 2 * a * b scaled by 1/2^16.
  *
  * The multiplicand is split into its upper half ((a) >> 16) and lower
  * half ((a) & 0xffff); each half is multiplied by b separately and the
  * two partial results are added.
  *
  * Both arguments are expanded more than once, so pass only expressions
  * without side effects.
  *
  * @param a 32 bit multiplicand
  * @param b 16 bit multiplier
  */
 #define MULL2(a, b)                                  \
         (  ((((a) >> 16) * (b)) * 2)                 \
          + ((((a) & 0xffff) * (b)) >> 15)  )

 /**
  * Kinds of G723.1 frame.
  *
  * The numeric values are the implicit ones (0, 1, 2), spelled out here.
  */
 enum FrameType {
     ACTIVE_FRAME        = 0, ///< Active speech
     SID_FRAME           = 1, ///< Silence Insertion Descriptor frame
     UNTRANSMITTED_FRAME = 2
 };

 /**
  * G723.1 rate selector.
  *
  * The enumerators are named after the two rates (6300 and 5300,
  * presumably bit/s); their numeric values are 0 and 1.
  */
 enum Rate {
     RATE_6300 = 0,
     RATE_5300 = 1
 };

 /**
  * Unpacked parameters of one G723.1 subframe.
  *
  * All members are plain ints; the member order is part of the layout
  * and must not be changed.
  */
 typedef struct G723_1_Subframe {
     /* adaptive codebook */
     int ad_cb_lag;      ///< adaptive codebook lag
     int ad_cb_gain;     ///< adaptive codebook gain field

     /* remaining fields share their names with FCBParam (fixed codebook) */
     int dirac_train;
     int pulse_sign;
     int grid_index;
     int amp_index;
     int pulse_pos;
 } G723_1_Subframe;

 /**
  * Parameters of the pitch postfilter.
  */
 typedef struct PPFParam {
     /** postfilter backward/forward lag */
     int     index;
     /** optimal gain */
     int16_t opt_gain;
     /** scaling gain */
     int16_t sc_gain;
 } PPFParam;

 /**
  * Parameters of the harmonic filter: an index and a gain, both ints.
  */
 typedef struct HFParam {
     int index;   ///< filter index (semantics defined by the users of this struct)
     int gain;    ///< filter gain
 } HFParam;

 /**
  * Optimized fixed codebook excitation parameters.
  *
  * Carries one slot per pulse (PULSE_MAX of them) for position and sign,
  * next to the scalar fields.
  */
 typedef struct FCBParam {
     /* scalar fields */
     int min_err;
     int amp_index;
     int grid_index;
     int dirac_train;

     /* per-pulse fields */
     int pulse_pos[PULSE_MAX];
     int pulse_sign[PULSE_MAX];
 } FCBParam;

 /**
  * Codec state kept for one channel.
  *
  * G723_1_Context embeds two of these (ch[2]). Members after the
  * "encoder" marker are the ones the original author set apart as
  * encoder state. Member order defines the struct layout; do not reorder.
  */
 typedef struct G723_1_ChannelContext {
     /* one entry per subframe (4 == SUBFRAMES) */
     G723_1_Subframe subframe[4];
     enum FrameType cur_frame_type;
     enum FrameType past_frame_type;
     enum Rate cur_rate;
     /* one index per LSP band */
     uint8_t lsp_index[LSP_BANDS];
     int pitch_lag[2];
     int erased_frames;

     /* LPC_ORDER-sized LSP vectors and filter memories, PITCH_MAX-sized history */
     int16_t prev_lsp[LPC_ORDER];
     int16_t sid_lsp[LPC_ORDER];
     int16_t prev_excitation[PITCH_MAX];
     int16_t excitation[PITCH_MAX + FRAME_LEN + 4];
     int16_t synth_mem[LPC_ORDER];
     int16_t fir_mem[LPC_ORDER];
     int     iir_mem[LPC_ORDER];

     int random_seed;
     int cng_random_seed;
     int interp_index;
     int interp_gain;
     int sid_gain;
     int cur_gain;
     int reflection_coef;
     int pf_gain;                 ///< formant postfilter
                                  ///< gain scaling unit memory
     int16_t audio[FRAME_LEN + LPC_ORDER + PITCH_MAX + 4];

     /* encoder */
     int16_t prev_data[HALF_FRAME_LEN];
     int16_t prev_weight_sig[PITCH_MAX];

     int16_t hpf_fir_mem;                   ///< highpass filter fir
     int     hpf_iir_mem;                   ///< and iir memories
     int16_t perf_fir_mem[LPC_ORDER];       ///< perceptual filter fir
     int16_t perf_iir_mem[LPC_ORDER];       ///< and iir memories

     int16_t harmonic_mem[PITCH_MAX];
 } G723_1_ChannelContext;

 /**
  * Top-level G723.1 context: an AVClass pointer, the postfilter setting
  * and the state of two channels.
  */
 typedef struct G723_1_Context {
     /* AVClass comes from libavutil/log.h, included above */
     AVClass *class;
     /* NOTE(review): presumably an on/off switch for postfiltering; confirm against users */
     int postfilter;

     /* per-channel state, two channels */
     G723_1_ChannelContext ch[2];
 } G723_1_Context;


 /**
  * Scale the contents of a vector according to the largest absolute
  * value found among its elements.
  *
  * @param dst    output vector
  * @param vector input vector (not modified)
  * @param length presumably the number of elements in both vectors
  * @return an int whose meaning is not documented in this header;
  *         see the definition
  */
 int ff_g723_1_scale_vector(int16_t       *dst,
                            const int16_t *vector,
                            int            length);

 /**
  * Work out how many left-shifts are needed to normalize the input.
  *
  * @param num   input number
  * @param width selects the width of the input: 0 for 16 bits,
  *              1 for 32 bits
  * @return presumably the shift count described above
  */
 int ff_g723_1_normalize_bits(int num,
                              int width);

 /**
  * Dot product of two int16_t vectors (going by the name; any scaling or
  * saturation is decided by the definition, not by this header).
  *
  * @param a      first input vector (not modified)
  * @param b      second input vector (not modified)
  * @param length presumably the number of elements in each vector
  */
 int ff_g723_1_dot_product(const int16_t *a,
                           const int16_t *b,
                           int            length);

 /**
  * Fetch the delayed contribution from the previous excitation vector.
  *
  * @param residual        output buffer
  * @param prev_excitation previous excitation vector
  * @param lag             delay to apply (presumably a pitch lag)
  */
 void ff_g723_1_get_residual(int16_t *residual,
                             int16_t *prev_excitation,
                             int      lag);

 /**
  * Build a train of dirac functions whose period is the pitch lag.
  *
  * @param buf       buffer the train is generated in
  * @param pitch_lag period of the train
  */
 void ff_g723_1_gen_dirac_train(int16_t *buf,
                                int      pitch_lag);


 /**
  * Produce the adaptive codebook excitation.
  *
  * @param vector          output excitation vector
  * @param prev_excitation previous excitation vector
  * @param pitch_lag       pitch lag to use
  * @param subfrm          subframe parameters
  * @param cur_rate        rate currently in use
  */
 void ff_g723_1_gen_acb_excitation(int16_t         *vector,
                                   int16_t         *prev_excitation,
                                   int              pitch_lag,
                                   G723_1_Subframe *subfrm,
                                   enum Rate        cur_rate);
 /**
  * Interpolate between the previous and current LSP vectors to quantize
  * the LSP frequencies, then convert the result to the matching LPC
  * coefficients.
  *
  * @param lpc      buffer that receives the LPC coefficients
  * @param cur_lsp  the current LSP vector
  * @param prev_lsp the previous LSP vector
  */
 void ff_g723_1_lsp_interpolate(int16_t *lpc,
                                int16_t *cur_lsp,
                                int16_t *prev_lsp);

 /**
  * Inverse-quantize the LSP frequencies.
  *
  * @param cur_lsp    the current LSP vector
  * @param prev_lsp   the previous LSP vector
  * @param lsp_index  VQ indices
  * @param bad_frame  bad frame flag
  */
 void ff_g723_1_inverse_quant(int16_t *cur_lsp,
                              int16_t *prev_lsp,
                              uint8_t *lsp_index,
                              int      bad_frame);

 /*
  * Four frame sizes.
  * NOTE(review): presumably byte counts indexed by a 2-bit frame code;
  * confirm against the users of this table.
  */
 static const uint8_t frame_size[4] = {
     [0] = 24,
     [1] = 20,
     [2] =  4,
     [3] =  1,
 };

 /**
  * LSP DC component: one value per LSP coefficient (LPC_ORDER entries,
  * strictly increasing).
  */
 static const int16_t dc_lsp[LPC_ORDER] = {
     0x0c3b, 0x1271, 0x1e0a, 0x2a36, 0x3630,
     0x406f, 0x4d28, 0x56f4, 0x638c, 0x6c46,
 };

 /*
  * Cosine table scaled by 2^14; holds COS_TBL_SIZE + 1 entries.
  * G723_1_COS_TAB_FIRST_ELEMENT is 16384, i.e. 2^14 (going by its name,
  * the value of the table's first entry).
  */
 extern const int16_t ff_g723_1_cos_tab[COS_TBL_SIZE + 1];
 #define G723_1_COS_TAB_FIRST_ELEMENT 16384

 /**
  * LSP VQ tables, one per band, each with LSP_CB_SIZE rows.
  *
  * The rows are 3, 3 and 4 values wide, which adds up to LPC_ORDER (10).
  */
 extern const int16_t ff_g723_1_lsp_band0[LSP_CB_SIZE][3];
 extern const int16_t ff_g723_1_lsp_band1[LSP_CB_SIZE][3];
 extern const int16_t ff_g723_1_lsp_band2[LSP_CB_SIZE][4];

 /**
  * Used for the coding/decoding of the pulse positions
  * for the MP-MLQ codebook.
  *
  * Dimensions: PULSE_MAX rows by SUBFRAME_LEN / GRID_SIZE columns (6 x 30).
  */
 extern const int32_t ff_g723_1_combinatorial_table[PULSE_MAX][SUBFRAME_LEN/GRID_SIZE];

 /**
  * Number of non-zero pulses in the MP-MLQ excitation.
  *
  * Four entries alternating 6 and 5 (presumably one per subframe).
  */
 static const int8_t pulses[4] = {
     6, 5,
     6, 5,
 };

 /* Fixed codebook gain table, GAIN_LEVELS entries. */
 extern const int16_t ff_g723_1_fixed_cb_gain[GAIN_LEVELS];

 /* Adaptive codebook gain tables, stored flat: 85 * 20 and 170 * 20 values. */
 extern const int16_t ff_g723_1_adaptive_cb_gain85 [ 85 * 20];
 extern const int16_t ff_g723_1_adaptive_cb_gain170[170 * 20];

 #endif /* AVCODEC_G723_1_H */
	/*
	* G.723.1 common header and data tables
	* Copyright (c) 2006 Benjamin Larsson
	* Copyright (c) 2010 Mohamed Naufal Basheer
	*
	* This file is part of FFmpeg.
	*
	* FFmpeg is free software; you can redistribute it and/or
	* modify it under the terms of the GNU Lesser General Public
	* License as published by the Free Software Foundation; either
	* version 2.1 of the License, or (at your option) any later version.
	*
	* FFmpeg is distributed in the hope that it will be useful,
	* but WITHOUT ANY WARRANTY; without even the implied warranty of
	* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
	* Lesser General Public License for more details.
	*
	* You should have received a copy of the GNU Lesser General Public
	* License along with FFmpeg; if not, write to the Free Software
	* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
	*/

	/**
	* @file
	* G.723.1 types, functions and data tables
	*/

	#ifndef AVCODEC_G723_1_H
	#define AVCODEC_G723_1_H

	#include <stdint.h>

	#include "libavutil/log.h"

	/* Frame layout: a frame is SUBFRAMES subframes of SUBFRAME_LEN each. */
	#define SUBFRAMES       4                               /* subframes per frame */
	#define SUBFRAME_LEN    60                              /* length of one subframe */
	#define FRAME_LEN       (SUBFRAMES * SUBFRAME_LEN)      /* 240 */
	#define HALF_FRAME_LEN  (FRAME_LEN >> 1)                /* 120 */
	#define LPC_FRAME       (SUBFRAME_LEN + HALF_FRAME_LEN) /* 180 */

	/* LPC / LSP dimensions. */
	#define LPC_ORDER       10                              /* length of every LPC/LSP vector here */
	#define LSP_BANDS       3                               /* matches lsp_band0..lsp_band2 */
	#define LSP_CB_SIZE     256                             /* rows in each LSP VQ table */

	/* Pitch-related sizes. */
	#define PITCH_MIN       18
	#define PITCH_MAX       (127 + PITCH_MIN)               /* 145 */
	#define PITCH_ORDER     5

	/* Fixed codebook and table sizes. */
	#define GRID_SIZE       2
	#define PULSE_MAX       6                               /* size of the per-pulse arrays */
	#define GAIN_LEVELS     24                              /* entries in ff_g723_1_fixed_cb_gain */
	#define COS_TBL_SIZE    512                             /* cosine table holds COS_TBL_SIZE + 1 */

	/**
	 * Bit-exact fixed-point product: 2 * a * b scaled by 1/2^16.
	 *
	 * The multiplicand is split into its upper half ((a) >> 16) and lower
	 * half ((a) & 0xffff); each half is multiplied by b separately and the
	 * two partial results are added.
	 *
	 * Both arguments are expanded more than once, so pass only expressions
	 * without side effects.
	 *
	 * @param a 32 bit multiplicand
	 * @param b 16 bit multiplier
	 */
	#define MULL2(a, b)                                  \
	        (  ((((a) >> 16) * (b)) * 2)                 \
	         + ((((a) & 0xffff) * (b)) >> 15)  )

	/**
	 * Kinds of G723.1 frame.
	 *
	 * The numeric values are the implicit ones (0, 1, 2), spelled out here.
	 */
	enum FrameType {
	    ACTIVE_FRAME        = 0, ///< Active speech
	    SID_FRAME           = 1, ///< Silence Insertion Descriptor frame
	    UNTRANSMITTED_FRAME = 2
	};

	/**
	 * G723.1 rate selector.
	 *
	 * The enumerators are named after the two rates (6300 and 5300,
	 * presumably bit/s); their numeric values are 0 and 1.
	 */
	enum Rate {
	    RATE_6300 = 0,
	    RATE_5300 = 1
	};

	/**
	 * Unpacked parameters of one G723.1 subframe.
	 *
	 * All members are plain ints; the member order is part of the layout
	 * and must not be changed.
	 */
	typedef struct G723_1_Subframe {
	    /* adaptive codebook */
	    int ad_cb_lag;      ///< adaptive codebook lag
	    int ad_cb_gain;     ///< adaptive codebook gain field

	    /* remaining fields share their names with FCBParam (fixed codebook) */
	    int dirac_train;
	    int pulse_sign;
	    int grid_index;
	    int amp_index;
	    int pulse_pos;
	} G723_1_Subframe;

	/**
	 * Parameters of the pitch postfilter.
	 */
	typedef struct PPFParam {
	    /** postfilter backward/forward lag */
	    int     index;
	    /** optimal gain */
	    int16_t opt_gain;
	    /** scaling gain */
	    int16_t sc_gain;
	} PPFParam;

	/**
	 * Parameters of the harmonic filter: an index and a gain, both ints.
	 */
	typedef struct HFParam {
	    int index;   ///< filter index (semantics defined by the users of this struct)
	    int gain;    ///< filter gain
	} HFParam;

	/**
	 * Optimized fixed codebook excitation parameters.
	 *
	 * Carries one slot per pulse (PULSE_MAX of them) for position and sign,
	 * next to the scalar fields.
	 */
	typedef struct FCBParam {
	    /* scalar fields */
	    int min_err;
	    int amp_index;
	    int grid_index;
	    int dirac_train;

	    /* per-pulse fields */
	    int pulse_pos[PULSE_MAX];
	    int pulse_sign[PULSE_MAX];
	} FCBParam;

	/**
	 * Codec state kept for one channel.
	 *
	 * G723_1_Context embeds two of these (ch[2]). Members after the
	 * "encoder" marker are the ones the original author set apart as
	 * encoder state. Member order defines the struct layout; do not reorder.
	 */
	typedef struct G723_1_ChannelContext {
	    /* one entry per subframe (4 == SUBFRAMES) */
	    G723_1_Subframe subframe[4];
	    enum FrameType  cur_frame_type;
	    enum FrameType  past_frame_type;
	    enum Rate       cur_rate;
	    /* one index per LSP band */
	    uint8_t         lsp_index[LSP_BANDS];
	    int             pitch_lag[2];
	    int             erased_frames;

	    /* LPC_ORDER-sized LSP vectors and filter memories, PITCH_MAX-sized history */
	    int16_t prev_lsp[LPC_ORDER];
	    int16_t sid_lsp[LPC_ORDER];
	    int16_t prev_excitation[PITCH_MAX];
	    int16_t excitation[PITCH_MAX + FRAME_LEN + 4];
	    int16_t synth_mem[LPC_ORDER];
	    int16_t fir_mem[LPC_ORDER];
	    int     iir_mem[LPC_ORDER];

	    int random_seed;
	    int cng_random_seed;
	    int interp_index;
	    int interp_gain;
	    int sid_gain;
	    int cur_gain;
	    int reflection_coef;
	    /** formant postfilter gain scaling unit memory */
	    int pf_gain;
	    int16_t audio[FRAME_LEN + LPC_ORDER + PITCH_MAX + 4];

	    /* encoder */
	    int16_t prev_data[HALF_FRAME_LEN];
	    int16_t prev_weight_sig[PITCH_MAX];

	    /* highpass filter fir and iir memories */
	    int16_t hpf_fir_mem;
	    int     hpf_iir_mem;
	    /* perceptual filter fir and iir memories */
	    int16_t perf_fir_mem[LPC_ORDER];
	    int16_t perf_iir_mem[LPC_ORDER];

	    int16_t harmonic_mem[PITCH_MAX];
	} G723_1_ChannelContext;

	/**
	 * Top-level G723.1 context: an AVClass pointer, the postfilter setting
	 * and the state of two channels.
	 */
	typedef struct G723_1_Context {
	    /* AVClass comes from libavutil/log.h */
	    AVClass *class;
	    /* NOTE(review): presumably an on/off switch for postfiltering; confirm against users */
	    int postfilter;

	    /* per-channel state, two channels */
	    G723_1_ChannelContext ch[2];
	} G723_1_Context;


	/**
	 * Scale vector contents based on the largest of their absolutes.
	 *
	 * Both vectors are passed by pointer. The pointer declarators had been
	 * lost in this copy, leaving by-value int16_t parameters that conflict
	 * with the declaration earlier in this file.
	 *
	 * @param dst    output vector
	 * @param vector input vector (not modified)
	 * @param length presumably the number of elements in both vectors
	 * @return an int whose meaning is not documented in this header;
	 *         see the definition
	 */
	int ff_g723_1_scale_vector(int16_t *dst, const int16_t *vector, int length);

	/**
	 * Work out how many left-shifts are needed to normalize the input.
	 *
	 * @param num   input number
	 * @param width selects the width of the input: 0 for 16 bits,
	 *              1 for 32 bits
	 * @return presumably the shift count described above
	 */
	int ff_g723_1_normalize_bits(int num,
	                             int width);

	/**
	 * Dot product of two int16_t vectors (going by the name; any scaling or
	 * saturation is decided by the definition, not by this header).
	 *
	 * Both inputs are pointers to const data. The pointer declarators had
	 * been lost in this copy, which conflicts with the declaration earlier
	 * in this file.
	 *
	 * @param a      first input vector (not modified)
	 * @param b      second input vector (not modified)
	 * @param length presumably the number of elements in each vector
	 */
	int ff_g723_1_dot_product(const int16_t *a, const int16_t *b, int length);

	/**
	 * Get delayed contribution from the previous excitation vector.
	 *
	 * Both buffers are passed by pointer. The pointer declarators had been
	 * lost in this copy, which conflicts with the declaration earlier in
	 * this file.
	 *
	 * @param residual        output buffer
	 * @param prev_excitation previous excitation vector
	 * @param lag             delay to apply (presumably a pitch lag)
	 */
	void ff_g723_1_get_residual(int16_t *residual, int16_t *prev_excitation,
	                            int lag);

	/**
	 * Build a train of dirac functions whose period is the pitch lag.
	 *
	 * @param buf       buffer the train is generated in
	 * @param pitch_lag period of the train
	 */
	void ff_g723_1_gen_dirac_train(int16_t *buf,
	                               int      pitch_lag);


	/**
	 * Generate adaptive codebook excitation.
	 *
	 * The two vectors are passed by pointer. The pointer declarators had
	 * been lost in this copy, which conflicts with the declaration earlier
	 * in this file.
	 *
	 * @param vector          output excitation vector
	 * @param prev_excitation previous excitation vector
	 * @param pitch_lag       pitch lag to use
	 * @param subfrm          subframe parameters
	 * @param cur_rate        rate currently in use
	 */
	void ff_g723_1_gen_acb_excitation(int16_t *vector, int16_t *prev_excitation,
	                                  int pitch_lag, G723_1_Subframe *subfrm,
	                                  enum Rate cur_rate);
	/**
	 * Quantize LSP frequencies by interpolation and convert them to
	 * the corresponding LPC coefficients.
	 *
	 * All three arguments are pointers. The declarators on lpc and cur_lsp
	 * had been lost in this copy, which conflicts with the declaration
	 * earlier in this file.
	 *
	 * @param lpc      buffer for LPC coefficients
	 * @param cur_lsp  the current LSP vector
	 * @param prev_lsp the previous LSP vector
	 */
	void ff_g723_1_lsp_interpolate(int16_t *lpc, int16_t *cur_lsp,
	                               int16_t *prev_lsp);

	/**
	 * Perform inverse quantization of LSP frequencies.
	 *
	 * Both LSP vectors are passed by pointer. Their pointer declarators had
	 * been lost in this copy, which conflicts with the declaration earlier
	 * in this file.
	 *
	 * @param cur_lsp    the current LSP vector
	 * @param prev_lsp   the previous LSP vector
	 * @param lsp_index  VQ indices
	 * @param bad_frame  bad frame flag
	 */
	void ff_g723_1_inverse_quant(int16_t *cur_lsp, int16_t *prev_lsp,
	                             uint8_t *lsp_index, int bad_frame);

	/*
	 * Four frame sizes.
	 * NOTE(review): presumably byte counts indexed by a 2-bit frame code;
	 * confirm against the users of this table.
	 */
	static const uint8_t frame_size[4] = {
	    [0] = 24,
	    [1] = 20,
	    [2] =  4,
	    [3] =  1,
	};

	/**
	 * LSP DC component: one value per LSP coefficient (LPC_ORDER entries,
	 * strictly increasing).
	 */
	static const int16_t dc_lsp[LPC_ORDER] = {
	    0x0c3b, 0x1271, 0x1e0a, 0x2a36, 0x3630,
	    0x406f, 0x4d28, 0x56f4, 0x638c, 0x6c46,
	};

	/*
	 * Cosine table scaled by 2^14; holds COS_TBL_SIZE + 1 entries.
	 * G723_1_COS_TAB_FIRST_ELEMENT is 16384, i.e. 2^14 (going by its name,
	 * the value of the table's first entry).
	 */
	extern const int16_t ff_g723_1_cos_tab[COS_TBL_SIZE + 1];
	#define G723_1_COS_TAB_FIRST_ELEMENT 16384

	/**
	 * LSP VQ tables, one per band, each with LSP_CB_SIZE rows.
	 *
	 * The rows are 3, 3 and 4 values wide, which adds up to LPC_ORDER (10).
	 */
	extern const int16_t ff_g723_1_lsp_band0[LSP_CB_SIZE][3];
	extern const int16_t ff_g723_1_lsp_band1[LSP_CB_SIZE][3];
	extern const int16_t ff_g723_1_lsp_band2[LSP_CB_SIZE][4];

	/**
	 * Used for the coding/decoding of the pulse positions
	 * for the MP-MLQ codebook.
	 *
	 * Dimensions: PULSE_MAX rows by SUBFRAME_LEN / GRID_SIZE columns (6 x 30).
	 */
	extern const int32_t ff_g723_1_combinatorial_table[PULSE_MAX][SUBFRAME_LEN/GRID_SIZE];

	/**
	 * Number of non-zero pulses in the MP-MLQ excitation.
	 *
	 * Four entries alternating 6 and 5 (presumably one per subframe).
	 */
	static const int8_t pulses[4] = {
	    6, 5,
	    6, 5,
	};

	/* Fixed codebook gain table, GAIN_LEVELS entries. */
	extern const int16_t ff_g723_1_fixed_cb_gain[GAIN_LEVELS];

	/* Adaptive codebook gain tables, stored flat: 85 * 20 and 170 * 20 values. */
	extern const int16_t ff_g723_1_adaptive_cb_gain85 [ 85 * 20];
	extern const int16_t ff_g723_1_adaptive_cb_gain170[170 * 20];

	#endif /* AVCODEC_G723_1_H */