add .gitignore
This commit is contained in:
393
msext/Class/Common/VoiceConvert/amrwapper/amrFileCodec.mm
Executable file
393
msext/Class/Common/VoiceConvert/amrwapper/amrFileCodec.mm
Executable file
@@ -0,0 +1,393 @@
|
||||
//
|
||||
// amrFileCodec.cpp
|
||||
// amrDemoForiOS
|
||||
//
|
||||
// Created by Tang Xiaoping on 9/27/11.
|
||||
// Copyright 2011 test. All rights reserved.
|
||||
//
|
||||
|
||||
#include "amrFileCodec.h"
|
||||
int amrEncodeMode[] = {4750, 5150, 5900, 6700, 7400, 7950, 10200, 12200}; // amr 编码方式
|
||||
// 从WAVE文件中跳过WAVE文件头,直接到PCM音频数据
|
||||
void SkipToPCMAudioData(FILE* fpwave)
|
||||
{
|
||||
RIFFHEADER riff;
|
||||
FMTBLOCK fmt;
|
||||
XCHUNKHEADER chunk;
|
||||
WAVEFORMATX wfx;
|
||||
int bDataBlock = 0;
|
||||
|
||||
// 1. 读RIFF头
|
||||
fread(&riff, 1, sizeof(RIFFHEADER), fpwave);
|
||||
|
||||
// 2. 读FMT块 - 如果 fmt.nFmtSize>16 说明需要还有一个附属大小没有读
|
||||
fread(&chunk, 1, sizeof(XCHUNKHEADER), fpwave);
|
||||
if ( chunk.nChunkSize>16 )
|
||||
{
|
||||
fread(&wfx, 1, sizeof(WAVEFORMATX), fpwave);
|
||||
}
|
||||
else
|
||||
{
|
||||
memcpy(fmt.chFmtID, chunk.chChunkID, 4);
|
||||
fmt.nFmtSize = chunk.nChunkSize;
|
||||
fread(&fmt.wf, 1, sizeof(WAVEFORMAT), fpwave);
|
||||
}
|
||||
|
||||
// 3.转到data块 - 有些还有fact块等。
|
||||
while(!bDataBlock)
|
||||
{
|
||||
fread(&chunk, 1, sizeof(XCHUNKHEADER), fpwave);
|
||||
if ( !memcmp(chunk.chChunkID, "data", 4) )
|
||||
{
|
||||
bDataBlock = 1;
|
||||
break;
|
||||
}
|
||||
// 因为这个不是data块,就跳过块数据
|
||||
fseek(fpwave, chunk.nChunkSize, SEEK_CUR);
|
||||
}
|
||||
}
|
||||
|
||||
// 从WAVE文件读一个完整的PCM音频帧
|
||||
// 返回值: 0-错误 >0: 完整帧大小
|
||||
int ReadPCMFrame(short speech[], FILE* fpwave, int nChannels, int nBitsPerSample)
|
||||
{
|
||||
int nRead = 0;
|
||||
int x = 0, y=0;
|
||||
// unsigned short ush1=0, ush2=0, ush=0;
|
||||
|
||||
// 原始PCM音频帧数据
|
||||
unsigned char pcmFrame_8b1[PCM_FRAME_SIZE];
|
||||
unsigned char pcmFrame_8b2[PCM_FRAME_SIZE<<1];
|
||||
unsigned short pcmFrame_16b1[PCM_FRAME_SIZE];
|
||||
unsigned short pcmFrame_16b2[PCM_FRAME_SIZE<<1];
|
||||
|
||||
if (nBitsPerSample==8 && nChannels==1)
|
||||
{
|
||||
|
||||
nRead = fread(pcmFrame_8b1, (nBitsPerSample/8), PCM_FRAME_SIZE*nChannels, fpwave);
|
||||
|
||||
for(x=0; x<PCM_FRAME_SIZE; x++)
|
||||
{
|
||||
speech[x] =(short)((short)pcmFrame_8b1[x] << 7);
|
||||
}
|
||||
}
|
||||
else
|
||||
if (nBitsPerSample==8 && nChannels==2)
|
||||
{
|
||||
nRead = fread(pcmFrame_8b2, (nBitsPerSample/8), PCM_FRAME_SIZE*nChannels, fpwave);
|
||||
for( x=0, y=0; y<PCM_FRAME_SIZE; y++,x+=2 )
|
||||
{
|
||||
// 1 - 取两个声道之左声道
|
||||
speech[y] =(short)((short)pcmFrame_8b2[x+0] << 7);
|
||||
// 2 - 取两个声道之右声道
|
||||
//speech[y] =(short)((short)pcmFrame_8b2[x+1] << 7);
|
||||
// 3 - 取两个声道的平均值
|
||||
//ush1 = (short)pcmFrame_8b2[x+0];
|
||||
//ush2 = (short)pcmFrame_8b2[x+1];
|
||||
//ush = (ush1 + ush2) >> 1;
|
||||
//speech[y] = (short)((short)ush << 7);
|
||||
}
|
||||
}
|
||||
else
|
||||
if (nBitsPerSample==16 && nChannels==1)
|
||||
{
|
||||
nRead = fread(pcmFrame_16b1, (nBitsPerSample/8), PCM_FRAME_SIZE*nChannels, fpwave);
|
||||
for(x=0; x<PCM_FRAME_SIZE; x++)
|
||||
{
|
||||
speech[x] = (short)pcmFrame_16b1[x+0];
|
||||
}
|
||||
}
|
||||
else
|
||||
if (nBitsPerSample==16 && nChannels==2)
|
||||
{
|
||||
nRead = fread(pcmFrame_16b2, (nBitsPerSample/8), PCM_FRAME_SIZE*nChannels, fpwave);
|
||||
for( x=0, y=0; y<PCM_FRAME_SIZE; y++,x+=2 )
|
||||
{
|
||||
//speech[y] = (short)pcmFrame_16b2[x+0];
|
||||
speech[y] = (short)((int)((int)pcmFrame_16b2[x+0] + (int)pcmFrame_16b2[x+1])) >> 1;
|
||||
}
|
||||
}
|
||||
|
||||
// 如果读到的数据不是一个完整的PCM帧, 就返回0
|
||||
if (nRead<PCM_FRAME_SIZE*nChannels) return 0;
|
||||
|
||||
return nRead;
|
||||
}
|
||||
|
||||
// WAVE音频采样频率是8khz
|
||||
// 音频样本单元数 = 8000*0.02 = 160 (由采样频率决定)
|
||||
// 声道数 1 : 160
|
||||
// 2 : 160*2 = 320
|
||||
// bps决定样本(sample)大小
|
||||
// bps = 8 --> 8位 unsigned char
|
||||
// 16 --> 16位 unsigned short
|
||||
int EncodeWAVEFileToAMRFile(const char* pchWAVEFilename, const char* pchAMRFileName, int nChannels, int nBitsPerSample)
|
||||
{
|
||||
FILE* fpwave;
|
||||
FILE* fpamr;
|
||||
|
||||
/* input speech vector */
|
||||
short speech[160];
|
||||
|
||||
/* counters */
|
||||
int byte_counter, frames = 0, bytes = 0;
|
||||
|
||||
/* pointer to encoder state structure */
|
||||
void *enstate;
|
||||
|
||||
/* requested mode */
|
||||
enum Mode req_mode = MR122;
|
||||
int dtx = 0;
|
||||
|
||||
/* bitstream filetype */
|
||||
unsigned char amrFrame[MAX_AMR_FRAME_SIZE];
|
||||
|
||||
fpwave = fopen(pchWAVEFilename, "rb");
|
||||
if (fpwave == NULL)
|
||||
{
|
||||
return 0;
|
||||
}
|
||||
|
||||
// 创建并初始化amr文件
|
||||
fpamr = fopen(pchAMRFileName, "wb");
|
||||
if (fpamr == NULL)
|
||||
{
|
||||
fclose(fpwave);
|
||||
return 0;
|
||||
}
|
||||
/* write magic number to indicate single channel AMR file storage format */
|
||||
bytes = fwrite(AMR_MAGIC_NUMBER, sizeof(char), strlen(AMR_MAGIC_NUMBER), fpamr);
|
||||
|
||||
/* skip to pcm audio data*/
|
||||
SkipToPCMAudioData(fpwave);
|
||||
|
||||
enstate = Encoder_Interface_init(dtx);
|
||||
|
||||
while(1)
|
||||
{
|
||||
// read one pcm frame
|
||||
if (!ReadPCMFrame(speech, fpwave, nChannels, nBitsPerSample)) break;
|
||||
|
||||
frames++;
|
||||
|
||||
/* call encoder */
|
||||
byte_counter = Encoder_Interface_Encode(enstate, req_mode, speech, amrFrame, 0);
|
||||
|
||||
bytes += byte_counter;
|
||||
fwrite(amrFrame, sizeof (unsigned char), byte_counter, fpamr );
|
||||
}
|
||||
|
||||
Encoder_Interface_exit(enstate);
|
||||
|
||||
fclose(fpamr);
|
||||
fclose(fpwave);
|
||||
|
||||
return frames;
|
||||
}
|
||||
|
||||
|
||||
|
||||
|
||||
#pragma mark - Decode
|
||||
//decode
|
||||
void WriteWAVEFileHeader(FILE* fpwave, int nFrame)
|
||||
{
|
||||
char tag[10] = "";
|
||||
|
||||
// 1. 写RIFF头
|
||||
RIFFHEADER riff;
|
||||
strcpy(tag, "RIFF");
|
||||
memcpy(riff.chRiffID, tag, 4);
|
||||
riff.nRiffSize = 4 // WAVE
|
||||
+ sizeof(XCHUNKHEADER) // fmt
|
||||
+ sizeof(WAVEFORMATX) // WAVEFORMATX
|
||||
+ sizeof(XCHUNKHEADER) // DATA
|
||||
+ nFrame*160*sizeof(short); //
|
||||
strcpy(tag, "WAVE");
|
||||
memcpy(riff.chRiffFormat, tag, 4);
|
||||
fwrite(&riff, 1, sizeof(RIFFHEADER), fpwave);
|
||||
|
||||
// 2. 写FMT块
|
||||
XCHUNKHEADER chunk;
|
||||
WAVEFORMATX wfx;
|
||||
strcpy(tag, "fmt ");
|
||||
memcpy(chunk.chChunkID, tag, 4);
|
||||
chunk.nChunkSize = sizeof(WAVEFORMATX);
|
||||
fwrite(&chunk, 1, sizeof(XCHUNKHEADER), fpwave);
|
||||
memset(&wfx, 0, sizeof(WAVEFORMATX));
|
||||
wfx.nFormatTag = 1;
|
||||
wfx.nChannels = 1; // 单声道
|
||||
wfx.nSamplesPerSec = 8000; // 8khz
|
||||
wfx.nAvgBytesPerSec = 16000;
|
||||
wfx.nBlockAlign = 2;
|
||||
wfx.nBitsPerSample = 16; // 16位
|
||||
fwrite(&wfx, 1, sizeof(WAVEFORMATX), fpwave);
|
||||
|
||||
// 3. 写data块头
|
||||
strcpy(tag, "data");
|
||||
memcpy(chunk.chChunkID, tag, 4);
|
||||
chunk.nChunkSize = nFrame*160*sizeof(short);
|
||||
fwrite(&chunk, 1, sizeof(XCHUNKHEADER), fpwave);
|
||||
}
|
||||
|
||||
const int myround(const double x)
|
||||
{
|
||||
return((int)(x+0.5));
|
||||
}
|
||||
|
||||
// 根据帧头计算当前帧大小
|
||||
int caclAMRFrameSize(unsigned char frameHeader)
|
||||
{
|
||||
int mode;
|
||||
int temp1 = 0;
|
||||
int temp2 = 0;
|
||||
int frameSize;
|
||||
|
||||
temp1 = frameHeader;
|
||||
|
||||
// 编码方式编号 = 帧头的3-6位
|
||||
temp1 &= 0x78; // 0111-1000
|
||||
temp1 >>= 3;
|
||||
|
||||
mode = amrEncodeMode[temp1];
|
||||
|
||||
// 计算amr音频数据帧大小
|
||||
// 原理: amr 一帧对应20ms,那么一秒有50帧的音频数据
|
||||
temp2 = myround((double)(((double)mode / (double)AMR_FRAME_COUNT_PER_SECOND) / (double)8));
|
||||
|
||||
frameSize = myround((double)temp2 + 0.5);
|
||||
return frameSize;
|
||||
}
|
||||
|
||||
// 读第一个帧 - (参考帧)
|
||||
// 返回值: 0-出错; 1-正确
|
||||
int ReadAMRFrameFirst(FILE* fpamr, unsigned char frameBuffer[], int* stdFrameSize, unsigned char* stdFrameHeader)
|
||||
{
|
||||
#pragma clang diagnostic push
|
||||
#pragma clang diagnostic ignored "-Wsizeof-array-argument"
|
||||
#pragma clang diagnostic ignored "-Wsizeof-pointer-memaccess"
|
||||
memset(frameBuffer, 0, sizeof(frameBuffer));
|
||||
#pragma clang diagnostic pop
|
||||
|
||||
// 先读帧头
|
||||
fread(stdFrameHeader, 1, sizeof(unsigned char), fpamr);
|
||||
if (feof(fpamr)) return 0;
|
||||
|
||||
// 根据帧头计算帧大小
|
||||
*stdFrameSize = caclAMRFrameSize(*stdFrameHeader);
|
||||
|
||||
// 读首帧
|
||||
frameBuffer[0] = *stdFrameHeader;
|
||||
fread(&(frameBuffer[1]), 1, (*stdFrameSize-1)*sizeof(unsigned char), fpamr);
|
||||
if (feof(fpamr)) return 0;
|
||||
|
||||
return 1;
|
||||
}
|
||||
|
||||
// 返回值: 0-出错; 1-正确
|
||||
int ReadAMRFrame(FILE* fpamr, unsigned char frameBuffer[], int stdFrameSize, unsigned char stdFrameHeader)
|
||||
{
|
||||
int bytes = 0;
|
||||
unsigned char frameHeader; // 帧头
|
||||
#pragma clang diagnostic push
|
||||
#pragma clang diagnostic ignored "-Wsizeof-array-argument"
|
||||
#pragma clang diagnostic ignored "-Wsizeof-pointer-memaccess"
|
||||
memset(frameBuffer, 0, sizeof(frameBuffer));
|
||||
#pragma clang diagnostic pop
|
||||
|
||||
// 读帧头
|
||||
// 如果是坏帧(不是标准帧头),则继续读下一个字节,直到读到标准帧头
|
||||
while(1)
|
||||
{
|
||||
bytes = fread(&frameHeader, 1, sizeof(unsigned char), fpamr);
|
||||
if (feof(fpamr)) return 0;
|
||||
if (frameHeader == stdFrameHeader) break;
|
||||
}
|
||||
|
||||
// 读该帧的语音数据(帧头已经读过)
|
||||
frameBuffer[0] = frameHeader;
|
||||
bytes = fread(&(frameBuffer[1]), 1, (stdFrameSize-1)*sizeof(unsigned char), fpamr);
|
||||
if (feof(fpamr)) return 0;
|
||||
|
||||
return 1;
|
||||
}
|
||||
|
||||
// 将AMR文件解码成WAVE文件
|
||||
int DecodeAMRFileToWAVEFile(const char* pchAMRFileName, const char* pchWAVEFilename)
|
||||
{
|
||||
|
||||
|
||||
FILE* fpamr = NULL;
|
||||
FILE* fpwave = NULL;
|
||||
char magic[8];
|
||||
void * destate;
|
||||
int nFrameCount = 0;
|
||||
int stdFrameSize;
|
||||
unsigned char stdFrameHeader;
|
||||
|
||||
unsigned char amrFrame[MAX_AMR_FRAME_SIZE];
|
||||
short pcmFrame[PCM_FRAME_SIZE];
|
||||
|
||||
// NSString * path = [[NSBundle mainBundle] pathForResource: @"test" ofType: @"amr"];
|
||||
// fpamr = fopen([path cStringUsingEncoding:NSASCIIStringEncoding], "rb");
|
||||
fpamr = fopen(pchAMRFileName, "rb");
|
||||
|
||||
if ( fpamr==NULL ) return 0;
|
||||
|
||||
// 检查amr文件头
|
||||
fread(magic, sizeof(char), strlen(AMR_MAGIC_NUMBER), fpamr);
|
||||
if (strncmp(magic, AMR_MAGIC_NUMBER, strlen(AMR_MAGIC_NUMBER)))
|
||||
{
|
||||
fclose(fpamr);
|
||||
return 0;
|
||||
}
|
||||
|
||||
// 创建并初始化WAVE文件
|
||||
// NSArray *paths = NSSearchPathForDirectoriesInDomains(NSDocumentDirectory, NSUserDomainMask, YES);
|
||||
// NSString *documentPath = [paths objectAtIndex:0];
|
||||
// NSString *docFilePath = [documentPath stringByAppendingPathComponent:[NSString stringWithFormat:@"%s", pchWAVEFilename]];
|
||||
// NSLog(@"documentPath=%@", documentPath);
|
||||
//
|
||||
// fpwave = fopen([docFilePath cStringUsingEncoding:NSASCIIStringEncoding], "wb");
|
||||
fpwave = fopen(pchWAVEFilename,"wb");
|
||||
|
||||
WriteWAVEFileHeader(fpwave, nFrameCount);
|
||||
|
||||
/* init decoder */
|
||||
destate = Decoder_Interface_init();
|
||||
|
||||
// 读第一帧 - 作为参考帧
|
||||
memset(amrFrame, 0, sizeof(amrFrame));
|
||||
memset(pcmFrame, 0, sizeof(pcmFrame));
|
||||
ReadAMRFrameFirst(fpamr, amrFrame, &stdFrameSize, &stdFrameHeader);
|
||||
|
||||
// 解码一个AMR音频帧成PCM数据
|
||||
Decoder_Interface_Decode(destate, amrFrame, pcmFrame, 0);
|
||||
nFrameCount++;
|
||||
fwrite(pcmFrame, sizeof(short), PCM_FRAME_SIZE, fpwave);
|
||||
|
||||
// 逐帧解码AMR并写到WAVE文件里
|
||||
while(1)
|
||||
{
|
||||
memset(amrFrame, 0, sizeof(amrFrame));
|
||||
memset(pcmFrame, 0, sizeof(pcmFrame));
|
||||
if (!ReadAMRFrame(fpamr, amrFrame, stdFrameSize, stdFrameHeader)) break;
|
||||
|
||||
// 解码一个AMR音频帧成PCM数据 (8k-16b-单声道)
|
||||
Decoder_Interface_Decode(destate, amrFrame, pcmFrame, 0);
|
||||
nFrameCount++;
|
||||
fwrite(pcmFrame, sizeof(short), PCM_FRAME_SIZE, fpwave);
|
||||
}
|
||||
printf("frame = %d\n", nFrameCount);
|
||||
Decoder_Interface_exit(destate);
|
||||
|
||||
fclose(fpwave);
|
||||
|
||||
// 重写WAVE文件头
|
||||
// fpwave = fopen([docFilePath cStringUsingEncoding:NSASCIIStringEncoding], "r+");
|
||||
fpwave = fopen(pchWAVEFilename, "r+");
|
||||
WriteWAVEFileHeader(fpwave, nFrameCount);
|
||||
fclose(fpwave);
|
||||
|
||||
return nFrameCount;
|
||||
}
|
||||
Reference in New Issue
Block a user