You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
147 lines
6.4 KiB
147 lines
6.4 KiB
4 years ago
|
/* Copyright (C) 2002 Jean-Marc Valin */
|
||
|
/**
   @file modes.h
   @brief Describes the different modes of the codec
*/
|
||
|
/*
|
||
|
Redistribution and use in source and binary forms, with or without
|
||
|
modification, are permitted provided that the following conditions
|
||
|
are met:
|
||
|
|
||
|
- Redistributions of source code must retain the above copyright
|
||
|
notice, this list of conditions and the following disclaimer.
|
||
|
|
||
|
- Redistributions in binary form must reproduce the above copyright
|
||
|
notice, this list of conditions and the following disclaimer in the
|
||
|
documentation and/or other materials provided with the distribution.
|
||
|
|
||
|
- Neither the name of the Xiph.org Foundation nor the names of its
|
||
|
contributors may be used to endorse or promote products derived from
|
||
|
this software without specific prior written permission.
|
||
|
|
||
|
THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
|
||
|
``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
|
||
|
LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
|
||
|
A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR
|
||
|
CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
|
||
|
EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
|
||
|
PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
|
||
|
PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
|
||
|
LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
|
||
|
NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
|
||
|
SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
||
|
|
||
|
*/
|
||
|
|
||
|
#ifndef MODES_H
|
||
|
#define MODES_H
|
||
|
|
||
|
#include "speex.h"
|
||
|
#include "speex_bits.h"
|
||
|
|
||
|
|
||
|
/* Narrowband sub-mode table dimensions.
   NB_SUBMODES is the length of SpeexNBMode.submodes[]; it equals
   1 << NB_SUBMODE_BITS.
   NOTE(review): NB_SUBMODE_BITS is presumably the width of the sub-mode
   selector in the bit-stream -- confirm against the encoder/decoder. */
#define NB_SUBMODES 16
#define NB_SUBMODE_BITS 4

/* Wideband (SB-CELP) sub-mode table dimensions.
   SB_SUBMODES is the length of SpeexSBMode.submodes[]; it equals
   1 << SB_SUBMODE_BITS.
   NOTE(review): SB_SUBMODE_BITS is presumably the width of the sub-mode
   selector in the bit-stream -- confirm against the encoder/decoder. */
#define SB_SUBMODES 8
#define SB_SUBMODE_BITS 3
|
||
|
|
||
|
|
||
|
/** Quantizes LSPs */
|
||
|
typedef void (*lsp_quant_func)(float *, float *, int, SpeexBits *);
|
||
|
|
||
|
/** Decodes quantized LSPs */
|
||
|
typedef void (*lsp_unquant_func)(float *, int, SpeexBits *);
|
||
|
|
||
|
|
||
|
/** Long-term predictor quantization */
|
||
|
typedef int (*ltp_quant_func)(float *, float *, float *, float *,
|
||
|
float *, float *, void *, int, int, float,
|
||
|
int, int, SpeexBits*, char *, float *, float *, int);
|
||
|
|
||
|
/** Long-term un-quantize */
|
||
|
typedef void (*ltp_unquant_func)(float *, int, int, float, void *, int, int *,
|
||
|
float *, SpeexBits*, char*, int, int, float);
|
||
|
|
||
|
|
||
|
/** Innovation quantization function */
|
||
|
typedef void (*innovation_quant_func)(float *, float *, float *, float *, void *, int, int,
|
||
|
float *, float *, SpeexBits *, char *, int);
|
||
|
|
||
|
/** Innovation unquantization function */
|
||
|
typedef void (*innovation_unquant_func)(float *, void *, int, SpeexBits*, char *);
|
||
|
|
||
|
/** Description of a Speex sub-mode (wither narrowband or wideband */
|
||
|
typedef struct SpeexSubmode {
|
||
|
int lbr_pitch; /**< Set to -1 for "normal" modes, otherwise encode pitch using a global pitch and allowing a +- lbr_pitch variation (for low not-rates)*/
|
||
|
int forced_pitch_gain; /**< Use the same (forced) pitch gain for all sub-frames */
|
||
|
int have_subframe_gain; /**< Number of bits to use as sub-frame innovation gain */
|
||
|
int double_codebook; /**< Apply innovation quantization twice for higher quality (and higher bit-rate)*/
|
||
|
/*LSP functions*/
|
||
|
lsp_quant_func lsp_quant; /**< LSP quantization function */
|
||
|
lsp_unquant_func lsp_unquant; /**< LSP unquantization function */
|
||
|
|
||
|
/*Lont-term predictor functions*/
|
||
|
ltp_quant_func ltp_quant; /**< Long-term predictor (pitch) quantizer */
|
||
|
ltp_unquant_func ltp_unquant; /**< Long-term predictor (pitch) un-quantizer */
|
||
|
void *ltp_params; /**< Pitch parameters (options) */
|
||
|
|
||
|
/*Quantization of innovation*/
|
||
|
innovation_quant_func innovation_quant; /**< Innovation quantization */
|
||
|
innovation_unquant_func innovation_unquant; /**< Innovation un-quantization */
|
||
|
void *innovation_params; /**< Innovation quantization parameters*/
|
||
|
|
||
|
/*Synthesis filter enhancement*/
|
||
|
float lpc_enh_k1; /**< Enhancer constant */
|
||
|
float lpc_enh_k2; /**< Enhancer constant */
|
||
|
float comb_gain; /**< Gain of enhancer comb filter */
|
||
|
|
||
|
int bits_per_frame; /**< Number of bits per frame after encoding*/
|
||
|
} SpeexSubmode;
|
||
|
|
||
|
/** Struct defining the encoding/decoding mode*/
|
||
|
typedef struct SpeexNBMode {
|
||
|
int frameSize; /**< Size of frames used for encoding */
|
||
|
int subframeSize; /**< Size of sub-frames used for encoding */
|
||
|
int lpcSize; /**< Order of LPC filter */
|
||
|
int bufSize; /**< Size of signal buffer to use in encoder */
|
||
|
int pitchStart; /**< Smallest pitch value allowed */
|
||
|
int pitchEnd; /**< Largest pitch value allowed */
|
||
|
|
||
|
float gamma1; /**< Perceptual filter parameter #1 */
|
||
|
float gamma2; /**< Perceptual filter parameter #2 */
|
||
|
float lag_factor; /**< Lag-windowing parameter */
|
||
|
float lpc_floor; /**< Noise floor for LPC analysis */
|
||
|
float preemph; /**< Pre-emphasis */
|
||
|
|
||
|
SpeexSubmode *submodes[NB_SUBMODES]; /**< Sub-mode data for the mode */
|
||
|
int defaultSubmode; /**< Default sub-mode to use when encoding */
|
||
|
int quality_map[11]; /**< Mode corresponding to each quality setting */
|
||
|
} SpeexNBMode;
|
||
|
|
||
|
|
||
|
/** Struct defining the encoding/decoding mode for SB-CELP (wideband) */
|
||
|
typedef struct SpeexSBMode {
|
||
|
SpeexMode *nb_mode; /**< Embedded narrowband mode */
|
||
|
int frameSize; /**< Size of frames used for encoding */
|
||
|
int subframeSize; /**< Size of sub-frames used for encoding */
|
||
|
int lpcSize; /**< Order of LPC filter */
|
||
|
int bufSize; /**< Signal buffer size in encoder */
|
||
|
float gamma1; /**< Perceptual filter parameter #1 */
|
||
|
float gamma2; /**< Perceptual filter parameter #1 */
|
||
|
float lag_factor; /**< Lag-windowing parameter */
|
||
|
float lpc_floor; /**< Noise floor for LPC analysis */
|
||
|
float preemph; /**< Pre-emphasis */
|
||
|
float folding_gain;
|
||
|
|
||
|
SpeexSubmode *submodes[SB_SUBMODES]; /**< Sub-mode data for the mode */
|
||
|
int defaultSubmode; /**< Default sub-mode to use when encoding */
|
||
|
int low_quality_map[11]; /**< Mode corresponding to each quality setting */
|
||
|
int quality_map[11]; /**< Mode corresponding to each quality setting */
|
||
|
float (*vbr_thresh)[11];
|
||
|
int nb_modes;
|
||
|
} SpeexSBMode;
|
||
|
|
||
|
|
||
|
#endif
|