You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
146 lines
6.5 KiB
146 lines
6.5 KiB
/* Copyright (C) 2002 Jean-Marc Valin */ |
|
/** |
|
@file modes.h |
|
@brief Describes the different modes of the codec |
|
*/ |
|
/* |
|
Redistribution and use in source and binary forms, with or without |
|
modification, are permitted provided that the following conditions |
|
are met: |
|
|
|
- Redistributions of source code must retain the above copyright |
|
notice, this list of conditions and the following disclaimer. |
|
|
|
- Redistributions in binary form must reproduce the above copyright |
|
notice, this list of conditions and the following disclaimer in the |
|
documentation and/or other materials provided with the distribution. |
|
|
|
- Neither the name of the Xiph.org Foundation nor the names of its |
|
contributors may be used to endorse or promote products derived from |
|
this software without specific prior written permission. |
|
|
|
THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS |
|
``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT |
|
LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR |
|
A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR |
|
CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, |
|
EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, |
|
PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR |
|
PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF |
|
LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING |
|
NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS |
|
SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. |
|
|
|
*/ |
|
|
|
#ifndef MODES_H |
|
#define MODES_H |
|
|
|
#include "speex.h" |
|
#include "speex_bits.h" |
|
|
|
|
|
#define NB_SUBMODES 16 |
|
#define NB_SUBMODE_BITS 4 |
|
|
|
#define SB_SUBMODES 8 |
|
#define SB_SUBMODE_BITS 3 |
|
|
|
|
|
/** Quantizes LSPs */ |
|
typedef void (*lsp_quant_func)(float *, float *, int, SpeexBits *); |
|
|
|
/** Decodes quantized LSPs */ |
|
typedef void (*lsp_unquant_func)(float *, int, SpeexBits *); |
|
|
|
|
|
/** Long-term predictor quantization */ |
|
typedef int (*ltp_quant_func)(float *, float *, float *, float *, |
|
float *, float *, void *, int, int, float, |
|
int, int, SpeexBits*, char *, float *, float *, int); |
|
|
|
/** Long-term un-quantize */ |
|
typedef void (*ltp_unquant_func)(float *, int, int, float, void *, int, int *, |
|
float *, SpeexBits*, char*, int, int, float); |
|
|
|
|
|
/** Innovation quantization function */ |
|
typedef void (*innovation_quant_func)(float *, float *, float *, float *, void *, int, int, |
|
float *, float *, SpeexBits *, char *, int); |
|
|
|
/** Innovation unquantization function */ |
|
typedef void (*innovation_unquant_func)(float *, void *, int, SpeexBits*, char *); |
|
|
|
/** Description of a Speex sub-mode (wither narrowband or wideband */ |
|
typedef struct SpeexSubmode { |
|
int lbr_pitch; /**< Set to -1 for "normal" modes, otherwise encode pitch using a global pitch and allowing a +- lbr_pitch variation (for low not-rates)*/ |
|
int forced_pitch_gain; /**< Use the same (forced) pitch gain for all sub-frames */ |
|
int have_subframe_gain; /**< Number of bits to use as sub-frame innovation gain */ |
|
int double_codebook; /**< Apply innovation quantization twice for higher quality (and higher bit-rate)*/ |
|
/*LSP functions*/ |
|
lsp_quant_func lsp_quant; /**< LSP quantization function */ |
|
lsp_unquant_func lsp_unquant; /**< LSP unquantization function */ |
|
|
|
/*Lont-term predictor functions*/ |
|
ltp_quant_func ltp_quant; /**< Long-term predictor (pitch) quantizer */ |
|
ltp_unquant_func ltp_unquant; /**< Long-term predictor (pitch) un-quantizer */ |
|
void *ltp_params; /**< Pitch parameters (options) */ |
|
|
|
/*Quantization of innovation*/ |
|
innovation_quant_func innovation_quant; /**< Innovation quantization */ |
|
innovation_unquant_func innovation_unquant; /**< Innovation un-quantization */ |
|
void *innovation_params; /**< Innovation quantization parameters*/ |
|
|
|
/*Synthesis filter enhancement*/ |
|
float lpc_enh_k1; /**< Enhancer constant */ |
|
float lpc_enh_k2; /**< Enhancer constant */ |
|
float comb_gain; /**< Gain of enhancer comb filter */ |
|
|
|
int bits_per_frame; /**< Number of bits per frame after encoding*/ |
|
} SpeexSubmode; |
|
|
|
/** Struct defining the encoding/decoding mode*/ |
|
typedef struct SpeexNBMode { |
|
int frameSize; /**< Size of frames used for encoding */ |
|
int subframeSize; /**< Size of sub-frames used for encoding */ |
|
int lpcSize; /**< Order of LPC filter */ |
|
int bufSize; /**< Size of signal buffer to use in encoder */ |
|
int pitchStart; /**< Smallest pitch value allowed */ |
|
int pitchEnd; /**< Largest pitch value allowed */ |
|
|
|
float gamma1; /**< Perceptual filter parameter #1 */ |
|
float gamma2; /**< Perceptual filter parameter #2 */ |
|
float lag_factor; /**< Lag-windowing parameter */ |
|
float lpc_floor; /**< Noise floor for LPC analysis */ |
|
float preemph; /**< Pre-emphasis */ |
|
|
|
SpeexSubmode *submodes[NB_SUBMODES]; /**< Sub-mode data for the mode */ |
|
int defaultSubmode; /**< Default sub-mode to use when encoding */ |
|
int quality_map[11]; /**< Mode corresponding to each quality setting */ |
|
} SpeexNBMode; |
|
|
|
|
|
/** Struct defining the encoding/decoding mode for SB-CELP (wideband) */ |
|
typedef struct SpeexSBMode { |
|
SpeexMode *nb_mode; /**< Embedded narrowband mode */ |
|
int frameSize; /**< Size of frames used for encoding */ |
|
int subframeSize; /**< Size of sub-frames used for encoding */ |
|
int lpcSize; /**< Order of LPC filter */ |
|
int bufSize; /**< Signal buffer size in encoder */ |
|
float gamma1; /**< Perceptual filter parameter #1 */ |
|
float gamma2; /**< Perceptual filter parameter #1 */ |
|
float lag_factor; /**< Lag-windowing parameter */ |
|
float lpc_floor; /**< Noise floor for LPC analysis */ |
|
float preemph; /**< Pre-emphasis */ |
|
float folding_gain; |
|
|
|
SpeexSubmode *submodes[SB_SUBMODES]; /**< Sub-mode data for the mode */ |
|
int defaultSubmode; /**< Default sub-mode to use when encoding */ |
|
int low_quality_map[11]; /**< Mode corresponding to each quality setting */ |
|
int quality_map[11]; /**< Mode corresponding to each quality setting */ |
|
float (*vbr_thresh)[11]; |
|
int nb_modes; |
|
} SpeexSBMode; |
|
|
|
|
|
#endif
|
|
|