// Source: http://www.cnblogs.com/myitm/archive/2011/07/21/2113299.html
// demo.cpp : Defines the entry point for the console application.
#include "stdafx.h"
#include <speex/speex.h>
#include <stdio.h>
#include <ostream>
#include <speex/speex_preprocess.h>
#include <speex/speex_echo.h>
#pragma comment(lib,"libspeexdsp.lib")
#define FRAME_SIZE 160
int main(int argc, char **argv)
{
char *inFile;
FILE *fin,*fout1,*fout2,*fout3;
short in[FRAME_SIZE];
short out[FRAME_SIZE];
float input[FRAME_SIZE];
float output[FRAME_SIZE];
char cbits[200];
int nbBytes;
/*保存編碼的狀態*/
void *stateEncode;
void *stateDecode;
/*保存字節因此他們可以被speex常規讀寫*/
SpeexBits bitsEncode;
SpeexBits bitsDecode;
int i, tmp;
//新建一個新的編碼狀態在窄寬(narrowband)模式下
stateEncode = speex_encoder_init(&speex_nb_mode);
stateDecode = speex_decoder_init(&speex_nb_mode);
//設置質量爲8(15kbps)
tmp=0;
speex_encoder_ctl(stateEncode, SPEEX_SET_VBR, &tmp);
float q=4;
speex_encoder_ctl(stateEncode, SPEEX_SET_VBR_QUALITY, &q);
speex_encoder_ctl(stateEncode, SPEEX_SET_QUALITY, &tmp);
inFile = argv[1];
fin = fopen("c:/demo.pcm", "rb");
fout1 = fopen("c:/demo_speex.raw", "wb");
fout2 = fopen("c:/demo1.pcm", "wb");
fout3 = fopen("c:/demo_slience.pcm", "wb");
//初始化結構使他們保存數據
speex_bits_init(&bitsEncode);
speex_bits_init(&bitsDecode);
int ret;
int j=0;
SpeexPreprocessState * m_st;
SpeexEchoState *echo_state;
m_st=speex_preprocess_state_init(160, 8000);
// echo_state = speex_echo_state_init(160, 8000);
int denoise = 1;
int noiseSuppress = -25;
speex_preprocess_ctl(m_st, SPEEX_PREPROCESS_SET_DENOISE, &denoise); //降噪
speex_preprocess_ctl(m_st, SPEEX_PREPROCESS_SET_NOISE_SUPPRESS, &noiseSuppress); //設置噪聲的dB
int agc = 1;
q=24000;
//actually default is 8000(0,32768),here make it louder for voice is not loudy enough by default. 8000
speex_preprocess_ctl(m_st, SPEEX_PREPROCESS_SET_AGC, &agc);//增益
speex_preprocess_ctl(m_st, SPEEX_PREPROCESS_SET_AGC_LEVEL,&q);
int vad = 1;
int vadProbStart = 80;
int vadProbContinue = 65;
speex_preprocess_ctl(m_st, SPEEX_PREPROCESS_SET_VAD, &vad); //靜音檢測
speex_preprocess_ctl(m_st, SPEEX_PREPROCESS_SET_PROB_START , &vadProbStart); //Set probability required for the VAD to go from silence to voice
speex_preprocess_ctl(m_st, SPEEX_PREPROCESS_SET_PROB_CONTINUE, &vadProbContinue); //Set probability required for the VAD to stay in the voice state (integer percent)
while (1)
{
memset(out,0,FRAME_SIZE*sizeof(short));
//讀入一幀16bits的聲音
j++;
int r=fread(in, sizeof(short), FRAME_SIZE, fin);
if (r<FRAME_SIZE)
break;
//把16bits的值轉化爲float,以便speex庫可以在上面工作
spx_int16_t * ptr=(spx_int16_t *)in;
if (speex_preprocess_run(m_st, ptr))//預處理 打開了靜音檢測和降噪
{
printf("speech,");
fwrite(in, sizeof(short), FRAME_SIZE, fout3);
}
else
{
printf("slience,");
fwrite(out, sizeof(short), FRAME_SIZE, fout3);
}
for (i=0;i<FRAME_SIZE;i++)
input[i]=in[i];
//清空這個結構體裏所有的字節,以便我們可以編碼一個新的幀
speex_bits_reset(&bitsEncode);
//對幀進行編碼
ret=speex_encode(stateEncode, input, &bitsEncode);
//把bits拷貝到一個利用寫出的char型數組
nbBytes = speex_bits_write(&bitsEncode, cbits, 200);
fwrite(cbits, sizeof(char), nbBytes, fout1);
printf("%02d,",nbBytes);
//清空這個結構體裏所有的字節,以便我們可以編碼一個新的幀
speex_bits_reset(&bitsDecode);
//將編碼數據如讀入bits
speex_bits_read_from(&bitsDecode, cbits, nbBytes);
//對幀進行解碼
ret = speex_decode(stateDecode, &bitsDecode,output);
for (i=0;i<FRAME_SIZE;i++)
out[i]=output[i];
fwrite(out, sizeof(short), FRAME_SIZE, fout2);
}
//釋放編碼器狀態量
speex_encoder_destroy(stateEncode);
//釋放bit_packing結構
speex_bits_destroy(&bitsEncode);
speex_decoder_destroy(stateDecode);
//釋放bit_packing結構
speex_bits_destroy(&bitsDecode);
fclose(fin);
fclose(fout1);
fclose(fout2);
fclose(fout3);
return 0;
}