You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
650 lines
14 KiB
650 lines
14 KiB
/* Copyright (C) 2002 Jean-Marc Valin
|
|
File: modes.c
|
|
|
|
Describes the different modes of the codec
|
|
|
|
Redistribution and use in source and binary forms, with or without
|
|
modification, are permitted provided that the following conditions
|
|
are met:
|
|
|
|
- Redistributions of source code must retain the above copyright
|
|
notice, this list of conditions and the following disclaimer.
|
|
|
|
- Redistributions in binary form must reproduce the above copyright
|
|
notice, this list of conditions and the following disclaimer in the
|
|
documentation and/or other materials provided with the distribution.
|
|
|
|
- Neither the name of the Xiph.org Foundation nor the names of its
|
|
contributors may be used to endorse or promote products derived from
|
|
this software without specific prior written permission.
|
|
|
|
THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
|
|
``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
|
|
LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
|
|
A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR
|
|
CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
|
|
EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
|
|
PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
|
|
PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
|
|
LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
|
|
NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
|
|
SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
|
|
|
*/
|
|
|
|
#include "modes.h"
|
|
#include "ltp.h"
|
|
#include "quant_lsp.h"
|
|
#include "cb_search.h"
|
|
#include "sb_celp.h"
|
|
#include "nb_celp.h"
|
|
#include "vbr.h"
|
|
#include "misc.h"
|
|
|
|
#ifndef NULL
|
|
#define NULL 0
|
|
#endif
|
|
|
|
SpeexMode *speex_mode_list[SPEEX_NB_MODES] = {&speex_nb_mode, &speex_wb_mode, &speex_uwb_mode};
|
|
|
|
/* Extern declarations for all codebooks we use here */
|
|
extern signed char gain_cdbk_nb[];
|
|
extern signed char gain_cdbk_lbr[];
|
|
extern signed char hexc_table[];
|
|
extern signed char exc_5_256_table[];
|
|
extern signed char exc_5_64_table[];
|
|
extern signed char exc_8_128_table[];
|
|
extern signed char exc_10_32_table[];
|
|
extern signed char exc_10_16_table[];
|
|
extern signed char exc_20_32_table[];
|
|
extern signed char hexc_10_32_table[];
|
|
|
|
static int nb_mode_query(void *mode, int request, void *ptr);
|
|
static int wb_mode_query(void *mode, int request, void *ptr);
|
|
|
|
/* Parameters for Long-Term Prediction (LTP)*/
|
|
static ltp_params ltp_params_nb = {
|
|
gain_cdbk_nb,
|
|
7,
|
|
7
|
|
};
|
|
|
|
/* Parameters for Long-Term Prediction (LTP)*/
|
|
static ltp_params ltp_params_vlbr = {
|
|
gain_cdbk_lbr,
|
|
5,
|
|
0
|
|
};
|
|
|
|
/* Parameters for Long-Term Prediction (LTP)*/
|
|
static ltp_params ltp_params_lbr = {
|
|
gain_cdbk_lbr,
|
|
5,
|
|
7
|
|
};
|
|
|
|
/* Parameters for Long-Term Prediction (LTP)*/
|
|
static ltp_params ltp_params_med = {
|
|
gain_cdbk_lbr,
|
|
5,
|
|
7
|
|
};
|
|
|
|
/* Split-VQ innovation parameters for very low bit-rate narrowband */
|
|
static split_cb_params split_cb_nb_vlbr = {
|
|
10, /*subvect_size*/
|
|
4, /*nb_subvect*/
|
|
exc_10_16_table, /*shape_cb*/
|
|
4, /*shape_bits*/
|
|
0,
|
|
};
|
|
|
|
/* Split-VQ innovation parameters for very low bit-rate narrowband */
|
|
static split_cb_params split_cb_nb_ulbr = {
|
|
20, /*subvect_size*/
|
|
2, /*nb_subvect*/
|
|
exc_20_32_table, /*shape_cb*/
|
|
5, /*shape_bits*/
|
|
0,
|
|
};
|
|
|
|
/* Split-VQ innovation parameters for low bit-rate narrowband */
|
|
static split_cb_params split_cb_nb_lbr = {
|
|
10, /*subvect_size*/
|
|
4, /*nb_subvect*/
|
|
exc_10_32_table, /*shape_cb*/
|
|
5, /*shape_bits*/
|
|
0,
|
|
};
|
|
|
|
|
|
/* Split-VQ innovation parameters narrowband */
|
|
static split_cb_params split_cb_nb = {
|
|
5, /*subvect_size*/
|
|
8, /*nb_subvect*/
|
|
exc_5_64_table, /*shape_cb*/
|
|
6, /*shape_bits*/
|
|
0,
|
|
};
|
|
|
|
/* Split-VQ innovation parameters narrowband */
|
|
static split_cb_params split_cb_nb_med = {
|
|
8, /*subvect_size*/
|
|
5, /*nb_subvect*/
|
|
exc_8_128_table, /*shape_cb*/
|
|
7, /*shape_bits*/
|
|
0,
|
|
};
|
|
|
|
/* Split-VQ innovation for low-band wideband */
|
|
static split_cb_params split_cb_sb = {
|
|
5, /*subvect_size*/
|
|
8, /*nb_subvect*/
|
|
exc_5_256_table, /*shape_cb*/
|
|
8, /*shape_bits*/
|
|
0,
|
|
};
|
|
|
|
/* Split-VQ innovation for high-band wideband */
|
|
static split_cb_params split_cb_high = {
|
|
8, /*subvect_size*/
|
|
5, /*nb_subvect*/
|
|
hexc_table, /*shape_cb*/
|
|
7, /*shape_bits*/
|
|
1,
|
|
};
|
|
|
|
|
|
/* Split-VQ innovation for high-band wideband */
|
|
static split_cb_params split_cb_high_lbr = {
|
|
10, /*subvect_size*/
|
|
4, /*nb_subvect*/
|
|
hexc_10_32_table, /*shape_cb*/
|
|
5, /*shape_bits*/
|
|
0,
|
|
};
|
|
|
|
/* 2150 bps "vocoder-like" mode for comfort noise */
|
|
static SpeexSubmode nb_submode1 = {
|
|
0,
|
|
1,
|
|
0,
|
|
0,
|
|
/* LSP quantization */
|
|
lsp_quant_lbr,
|
|
lsp_unquant_lbr,
|
|
/* No pitch quantization */
|
|
forced_pitch_quant,
|
|
forced_pitch_unquant,
|
|
NULL,
|
|
/* No innovation quantization (noise only) */
|
|
noise_codebook_quant,
|
|
noise_codebook_unquant,
|
|
NULL,
|
|
.7, .7, -1,
|
|
43
|
|
};
|
|
|
|
/* 3.95 kbps very low bit-rate mode */
|
|
static SpeexSubmode nb_submode8 = {
|
|
0,
|
|
1,
|
|
0,
|
|
0,
|
|
/*LSP quantization*/
|
|
lsp_quant_lbr,
|
|
lsp_unquant_lbr,
|
|
/*No pitch quantization*/
|
|
forced_pitch_quant,
|
|
forced_pitch_unquant,
|
|
NULL,
|
|
/*Innovation quantization*/
|
|
split_cb_search_shape_sign,
|
|
split_cb_shape_sign_unquant,
|
|
&split_cb_nb_ulbr,
|
|
|
|
0.7, 0.5, .65,
|
|
79
|
|
};
|
|
|
|
/* 5.95 kbps very low bit-rate mode */
|
|
static SpeexSubmode nb_submode2 = {
|
|
0,
|
|
0,
|
|
0,
|
|
0,
|
|
/*LSP quantization*/
|
|
lsp_quant_lbr,
|
|
lsp_unquant_lbr,
|
|
/*No pitch quantization*/
|
|
pitch_search_3tap,
|
|
pitch_unquant_3tap,
|
|
<p_params_vlbr,
|
|
/*Innovation quantization*/
|
|
split_cb_search_shape_sign,
|
|
split_cb_shape_sign_unquant,
|
|
&split_cb_nb_vlbr,
|
|
|
|
0.7, 0.5, .55,
|
|
119
|
|
};
|
|
|
|
/* 8 kbps low bit-rate mode */
|
|
static SpeexSubmode nb_submode3 = {
|
|
-1,
|
|
0,
|
|
1,
|
|
0,
|
|
/*LSP quantization*/
|
|
lsp_quant_lbr,
|
|
lsp_unquant_lbr,
|
|
/*Pitch quantization*/
|
|
pitch_search_3tap,
|
|
pitch_unquant_3tap,
|
|
<p_params_lbr,
|
|
/*Innovation quantization*/
|
|
split_cb_search_shape_sign,
|
|
split_cb_shape_sign_unquant,
|
|
&split_cb_nb_lbr,
|
|
|
|
0.7, 0.55, .45,
|
|
160
|
|
};
|
|
|
|
/* 11 kbps medium bit-rate mode */
|
|
static SpeexSubmode nb_submode4 = {
|
|
-1,
|
|
0,
|
|
1,
|
|
0,
|
|
/*LSP quantization*/
|
|
lsp_quant_lbr,
|
|
lsp_unquant_lbr,
|
|
/*Pitch quantization*/
|
|
pitch_search_3tap,
|
|
pitch_unquant_3tap,
|
|
<p_params_med,
|
|
/*Innovation quantization*/
|
|
split_cb_search_shape_sign,
|
|
split_cb_shape_sign_unquant,
|
|
&split_cb_nb_med,
|
|
|
|
0.7, 0.63, .35,
|
|
220
|
|
};
|
|
|
|
/* 15 kbps high bit-rate mode */
|
|
static SpeexSubmode nb_submode5 = {
|
|
-1,
|
|
0,
|
|
3,
|
|
0,
|
|
/*LSP quantization*/
|
|
lsp_quant_nb,
|
|
lsp_unquant_nb,
|
|
/*Pitch quantization*/
|
|
pitch_search_3tap,
|
|
pitch_unquant_3tap,
|
|
<p_params_nb,
|
|
/*Innovation quantization*/
|
|
split_cb_search_shape_sign,
|
|
split_cb_shape_sign_unquant,
|
|
&split_cb_nb,
|
|
|
|
0.7, 0.65, .25,
|
|
300
|
|
};
|
|
|
|
/* 18.2 high bit-rate mode */
|
|
static SpeexSubmode nb_submode6 = {
|
|
-1,
|
|
0,
|
|
3,
|
|
0,
|
|
/*LSP quantization*/
|
|
lsp_quant_nb,
|
|
lsp_unquant_nb,
|
|
/*Pitch quantization*/
|
|
pitch_search_3tap,
|
|
pitch_unquant_3tap,
|
|
<p_params_nb,
|
|
/*Innovation quantization*/
|
|
split_cb_search_shape_sign,
|
|
split_cb_shape_sign_unquant,
|
|
&split_cb_sb,
|
|
|
|
0.68, 0.65, .1,
|
|
364
|
|
};
|
|
|
|
/* 24.6 kbps high bit-rate mode */
|
|
static SpeexSubmode nb_submode7 = {
|
|
-1,
|
|
0,
|
|
3,
|
|
1,
|
|
/*LSP quantization*/
|
|
lsp_quant_nb,
|
|
lsp_unquant_nb,
|
|
/*Pitch quantization*/
|
|
pitch_search_3tap,
|
|
pitch_unquant_3tap,
|
|
<p_params_nb,
|
|
/*Innovation quantization*/
|
|
split_cb_search_shape_sign,
|
|
split_cb_shape_sign_unquant,
|
|
&split_cb_nb,
|
|
|
|
0.65, 0.65, -1,
|
|
492
|
|
};
|
|
|
|
|
|
/* Default mode for narrowband */
|
|
static SpeexNBMode nb_mode = {
|
|
160, /*frameSize*/
|
|
40, /*subframeSize*/
|
|
10, /*lpcSize*/
|
|
640, /*bufSize*/
|
|
17, /*pitchStart*/
|
|
144, /*pitchEnd*/
|
|
0.9, /*gamma1*/
|
|
0.6, /*gamma2*/
|
|
.01, /*lag_factor*/
|
|
1.0001, /*lpc_floor*/
|
|
0.0, /*preemph*/
|
|
{NULL, &nb_submode1, &nb_submode2, &nb_submode3, &nb_submode4, &nb_submode5, &nb_submode6, &nb_submode7,
|
|
&nb_submode8, NULL, NULL, NULL, NULL, NULL, NULL, NULL},
|
|
5,
|
|
{1, 8, 2, 3, 3, 4, 4, 5, 5, 6, 7}
|
|
};
|
|
|
|
|
|
/* Default mode for narrowband */
|
|
SpeexMode speex_nb_mode = {
|
|
&nb_mode,
|
|
nb_mode_query,
|
|
"narrowband",
|
|
0,
|
|
4,
|
|
&nb_encoder_init,
|
|
&nb_encoder_destroy,
|
|
&nb_encode,
|
|
&nb_decoder_init,
|
|
&nb_decoder_destroy,
|
|
&nb_decode,
|
|
&nb_encoder_ctl,
|
|
&nb_decoder_ctl,
|
|
};
|
|
|
|
|
|
/* Wideband part */
|
|
|
|
static SpeexSubmode wb_submode1 = {
|
|
0,
|
|
0,
|
|
1,
|
|
0,
|
|
/*LSP quantization*/
|
|
lsp_quant_high,
|
|
lsp_unquant_high,
|
|
/*Pitch quantization*/
|
|
NULL,
|
|
NULL,
|
|
NULL,
|
|
/*No innovation quantization*/
|
|
NULL,
|
|
NULL,
|
|
NULL,
|
|
|
|
.75, .75, -1,
|
|
36
|
|
};
|
|
|
|
|
|
static SpeexSubmode wb_submode2 = {
|
|
0,
|
|
0,
|
|
1,
|
|
0,
|
|
/*LSP quantization*/
|
|
lsp_quant_high,
|
|
lsp_unquant_high,
|
|
/*Pitch quantization*/
|
|
NULL,
|
|
NULL,
|
|
NULL,
|
|
/*Innovation quantization*/
|
|
split_cb_search_shape_sign,
|
|
split_cb_shape_sign_unquant,
|
|
&split_cb_high_lbr,
|
|
|
|
.85, .6, -1,
|
|
112
|
|
};
|
|
|
|
|
|
static SpeexSubmode wb_submode3 = {
|
|
0,
|
|
0,
|
|
1,
|
|
0,
|
|
/*LSP quantization*/
|
|
lsp_quant_high,
|
|
lsp_unquant_high,
|
|
/*Pitch quantization*/
|
|
NULL,
|
|
NULL,
|
|
NULL,
|
|
/*Innovation quantization*/
|
|
split_cb_search_shape_sign,
|
|
split_cb_shape_sign_unquant,
|
|
&split_cb_high,
|
|
|
|
.75, .7, -1,
|
|
192
|
|
};
|
|
|
|
static SpeexSubmode wb_submode4 = {
|
|
0,
|
|
0,
|
|
1,
|
|
1,
|
|
/*LSP quantization*/
|
|
lsp_quant_high,
|
|
lsp_unquant_high,
|
|
/*Pitch quantization*/
|
|
NULL,
|
|
NULL,
|
|
NULL,
|
|
/*Innovation quantization*/
|
|
split_cb_search_shape_sign,
|
|
split_cb_shape_sign_unquant,
|
|
&split_cb_high,
|
|
|
|
.75, .75, -1,
|
|
352
|
|
};
|
|
|
|
|
|
/* Split-band wideband CELP mode*/
|
|
static SpeexSBMode sb_wb_mode = {
|
|
&speex_nb_mode,
|
|
160, /*frameSize*/
|
|
40, /*subframeSize*/
|
|
8, /*lpcSize*/
|
|
640, /*bufSize*/
|
|
.9, /*gamma1*/
|
|
0.6, /*gamma2*/
|
|
.002, /*lag_factor*/
|
|
1.0001, /*lpc_floor*/
|
|
0.0, /*preemph*/
|
|
0.9,
|
|
{NULL, &wb_submode1, &wb_submode2, &wb_submode3, &wb_submode4, NULL, NULL, NULL},
|
|
3,
|
|
{1, 8, 2, 3, 4, 5, 5, 6, 6, 7, 7},
|
|
{1, 1, 1, 1, 1, 1, 2, 2, 3, 3, 4},
|
|
vbr_hb_thresh,
|
|
5
|
|
};
|
|
|
|
|
|
SpeexMode speex_wb_mode = {
|
|
&sb_wb_mode,
|
|
wb_mode_query,
|
|
"wideband (sub-band CELP)",
|
|
1,
|
|
4,
|
|
&sb_encoder_init,
|
|
&sb_encoder_destroy,
|
|
&sb_encode,
|
|
&sb_decoder_init,
|
|
&sb_decoder_destroy,
|
|
&sb_decode,
|
|
&sb_encoder_ctl,
|
|
&sb_decoder_ctl,
|
|
};
|
|
|
|
|
|
|
|
/* "Ultra-wideband" mode stuff */
|
|
|
|
|
|
|
|
/* Split-band "ultra-wideband" (32 kbps) CELP mode*/
|
|
static SpeexSBMode sb_uwb_mode = {
|
|
&speex_wb_mode,
|
|
320, /*frameSize*/
|
|
80, /*subframeSize*/
|
|
8, /*lpcSize*/
|
|
1280, /*bufSize*/
|
|
.9, /*gamma1*/
|
|
0.6, /*gamma2*/
|
|
.002, /*lag_factor*/
|
|
1.0001, /*lpc_floor*/
|
|
0.0, /*preemph*/
|
|
0.7,
|
|
{NULL, &wb_submode1, NULL, NULL, NULL, NULL, NULL, NULL},
|
|
1,
|
|
{0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10},
|
|
{0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1},
|
|
vbr_uhb_thresh,
|
|
2
|
|
};
|
|
|
|
|
|
SpeexMode speex_uwb_mode = {
|
|
&sb_uwb_mode,
|
|
wb_mode_query,
|
|
"ultra-wideband (sub-band CELP)",
|
|
2,
|
|
4,
|
|
&sb_encoder_init,
|
|
&sb_encoder_destroy,
|
|
&sb_encode,
|
|
&sb_decoder_init,
|
|
&sb_decoder_destroy,
|
|
&sb_decode,
|
|
&sb_encoder_ctl,
|
|
&sb_decoder_ctl,
|
|
};
|
|
|
|
|
|
|
|
|
|
void *speex_encoder_init(SpeexMode *mode)
|
|
{
|
|
return mode->enc_init(mode);
|
|
}
|
|
|
|
void *speex_decoder_init(SpeexMode *mode)
|
|
{
|
|
return mode->dec_init(mode);
|
|
}
|
|
|
|
void speex_encoder_destroy(void *state)
|
|
{
|
|
(*((SpeexMode**)state))->enc_destroy(state);
|
|
}
|
|
|
|
int speex_encode(void *state, float *in, SpeexBits *bits)
|
|
{
|
|
return (*((SpeexMode**)state))->enc(state, in, bits);
|
|
}
|
|
|
|
void speex_decoder_destroy(void *state)
|
|
{
|
|
(*((SpeexMode**)state))->dec_destroy(state);
|
|
}
|
|
|
|
int speex_decode(void *state, SpeexBits *bits, float *out)
|
|
{
|
|
return (*((SpeexMode**)state))->dec(state, bits, out);
|
|
}
|
|
|
|
|
|
int speex_encoder_ctl(void *state, int request, void *ptr)
|
|
{
|
|
return (*((SpeexMode**)state))->enc_ctl(state, request, ptr);
|
|
}
|
|
|
|
int speex_decoder_ctl(void *state, int request, void *ptr)
|
|
{
|
|
return (*((SpeexMode**)state))->dec_ctl(state, request, ptr);
|
|
}
|
|
|
|
|
|
|
|
static int nb_mode_query(void *mode, int request, void *ptr)
|
|
{
|
|
SpeexNBMode *m = (SpeexNBMode*)mode;
|
|
|
|
switch (request)
|
|
{
|
|
case SPEEX_MODE_FRAME_SIZE:
|
|
*((int*)ptr)=m->frameSize;
|
|
break;
|
|
case SPEEX_SUBMODE_BITS_PER_FRAME:
|
|
if (*((int*)ptr)==0)
|
|
*((int*)ptr) = NB_SUBMODE_BITS+1;
|
|
else if (m->submodes[*((int*)ptr)]==NULL)
|
|
*((int*)ptr) = -1;
|
|
else
|
|
*((int*)ptr) = m->submodes[*((int*)ptr)]->bits_per_frame;
|
|
break;
|
|
default:
|
|
speex_warning_int("Unknown nb_mode_query request: ", request);
|
|
return -1;
|
|
}
|
|
return 0;
|
|
}
|
|
|
|
static int wb_mode_query(void *mode, int request, void *ptr)
|
|
{
|
|
SpeexSBMode *m = (SpeexSBMode*)mode;
|
|
|
|
switch (request)
|
|
{
|
|
case SPEEX_MODE_FRAME_SIZE:
|
|
*((int*)ptr)=2*m->frameSize;
|
|
break;
|
|
case SPEEX_SUBMODE_BITS_PER_FRAME:
|
|
if (*((int*)ptr)==0)
|
|
*((int*)ptr) = SB_SUBMODE_BITS+1;
|
|
else if (m->submodes[*((int*)ptr)]==NULL)
|
|
*((int*)ptr) = -1;
|
|
else
|
|
*((int*)ptr) = m->submodes[*((int*)ptr)]->bits_per_frame;
|
|
break;
|
|
default:
|
|
speex_warning_int("Unknown wb_mode_query request: ", request);
|
|
return -1;
|
|
}
|
|
return 0;
|
|
}
|
|
|
|
|
|
int speex_mode_query(SpeexMode *mode, int request, void *ptr)
|
|
{
|
|
return mode->query(mode->mode, request, ptr);
|
|
}
|