amrFileCodec.mm 10 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384
  1. //
  2. // amrFileCodec.cpp
  3. // amrDemoForiOS
  4. //
  5. // Created by Tang Xiaoping on 9/27/11.
  6. // Copyright 2011 test. All rights reserved.
  7. //
  8. #include "amrFileCodec.h"
  9. int amrEncodeMode[] = {4750, 5150, 5900, 6700, 7400, 7950, 10200, 12200}; // amr 编码方式
  10. // 从WAVE文件中跳过WAVE文件头,直接到PCM音频数据
  11. void SkipToPCMAudioData(FILE* fpwave)
  12. {
  13. RIFFHEADER riff;
  14. FMTBLOCK fmt;
  15. XCHUNKHEADER chunk;
  16. WAVEFORMATX wfx;
  17. int bDataBlock = 0;
  18. // 1. 读RIFF头
  19. fread(&riff, 1, sizeof(RIFFHEADER), fpwave);
  20. // 2. 读FMT块 - 如果 fmt.nFmtSize>16 说明需要还有一个附属大小没有读
  21. fread(&chunk, 1, sizeof(XCHUNKHEADER), fpwave);
  22. if ( chunk.nChunkSize>16 )
  23. {
  24. fread(&wfx, 1, sizeof(WAVEFORMATX), fpwave);
  25. }
  26. else
  27. {
  28. memcpy(fmt.chFmtID, chunk.chChunkID, 4);
  29. fmt.nFmtSize = chunk.nChunkSize;
  30. fread(&fmt.wf, 1, sizeof(WAVEFORMAT), fpwave);
  31. }
  32. // 3.转到data块 - 有些还有fact块等。
  33. while(!bDataBlock)
  34. {
  35. fread(&chunk, 1, sizeof(XCHUNKHEADER), fpwave);
  36. if ( !memcmp(chunk.chChunkID, "data", 4) )
  37. {
  38. bDataBlock = 1;
  39. break;
  40. }
  41. // 因为这个不是data块,就跳过块数据
  42. fseek(fpwave, chunk.nChunkSize, SEEK_CUR);
  43. }
  44. }
  45. // 从WAVE文件读一个完整的PCM音频帧
  46. // 返回值: 0-错误 >0: 完整帧大小
  47. int ReadPCMFrame(short speech[], FILE* fpwave, int nChannels, int nBitsPerSample)
  48. {
  49. int nRead = 0;
  50. int x = 0, y=0;
  51. // unsigned short ush1=0, ush2=0, ush=0;
  52. // 原始PCM音频帧数据
  53. unsigned char pcmFrame_8b1[PCM_FRAME_SIZE];
  54. unsigned char pcmFrame_8b2[PCM_FRAME_SIZE<<1];
  55. unsigned short pcmFrame_16b1[PCM_FRAME_SIZE];
  56. unsigned short pcmFrame_16b2[PCM_FRAME_SIZE<<1];
  57. if (nBitsPerSample==8 && nChannels==1)
  58. {
  59. nRead = fread(pcmFrame_8b1, (nBitsPerSample/8), PCM_FRAME_SIZE*nChannels, fpwave);
  60. for(x=0; x<PCM_FRAME_SIZE; x++)
  61. {
  62. speech[x] =(short)((short)pcmFrame_8b1[x] << 7);
  63. }
  64. }
  65. else
  66. if (nBitsPerSample==8 && nChannels==2)
  67. {
  68. nRead = fread(pcmFrame_8b2, (nBitsPerSample/8), PCM_FRAME_SIZE*nChannels, fpwave);
  69. for( x=0, y=0; y<PCM_FRAME_SIZE; y++,x+=2 )
  70. {
  71. // 1 - 取两个声道之左声道
  72. speech[y] =(short)((short)pcmFrame_8b2[x+0] << 7);
  73. // 2 - 取两个声道之右声道
  74. //speech[y] =(short)((short)pcmFrame_8b2[x+1] << 7);
  75. // 3 - 取两个声道的平均值
  76. //ush1 = (short)pcmFrame_8b2[x+0];
  77. //ush2 = (short)pcmFrame_8b2[x+1];
  78. //ush = (ush1 + ush2) >> 1;
  79. //speech[y] = (short)((short)ush << 7);
  80. }
  81. }
  82. else
  83. if (nBitsPerSample==16 && nChannels==1)
  84. {
  85. nRead = fread(pcmFrame_16b1, (nBitsPerSample/8), PCM_FRAME_SIZE*nChannels, fpwave);
  86. for(x=0; x<PCM_FRAME_SIZE; x++)
  87. {
  88. speech[x] = (short)pcmFrame_16b1[x+0];
  89. }
  90. }
  91. else
  92. if (nBitsPerSample==16 && nChannels==2)
  93. {
  94. nRead = fread(pcmFrame_16b2, (nBitsPerSample/8), PCM_FRAME_SIZE*nChannels, fpwave);
  95. for( x=0, y=0; y<PCM_FRAME_SIZE; y++,x+=2 )
  96. {
  97. //speech[y] = (short)pcmFrame_16b2[x+0];
  98. speech[y] = (short)((int)((int)pcmFrame_16b2[x+0] + (int)pcmFrame_16b2[x+1])) >> 1;
  99. }
  100. }
  101. // 如果读到的数据不是一个完整的PCM帧, 就返回0
  102. if (nRead<PCM_FRAME_SIZE*nChannels) return 0;
  103. return nRead;
  104. }
  105. // WAVE音频采样频率是8khz
  106. // 音频样本单元数 = 8000*0.02 = 160 (由采样频率决定)
  107. // 声道数 1 : 160
  108. // 2 : 160*2 = 320
  109. // bps决定样本(sample)大小
  110. // bps = 8 --> 8位 unsigned char
  111. // 16 --> 16位 unsigned short
  112. int EncodeWAVEFileToAMRFile(const char* pchWAVEFilename, const char* pchAMRFileName, int nChannels, int nBitsPerSample)
  113. {
  114. FILE* fpwave;
  115. FILE* fpamr;
  116. /* input speech vector */
  117. short speech[160];
  118. /* counters */
  119. int byte_counter, frames = 0, bytes = 0;
  120. /* pointer to encoder state structure */
  121. void *enstate;
  122. /* requested mode */
  123. enum Mode req_mode = MR122;
  124. int dtx = 0;
  125. /* bitstream filetype */
  126. unsigned char amrFrame[MAX_AMR_FRAME_SIZE];
  127. fpwave = fopen(pchWAVEFilename, "rb");
  128. if (fpwave == NULL)
  129. {
  130. return 0;
  131. }
  132. // 创建并初始化amr文件
  133. fpamr = fopen(pchAMRFileName, "wb");
  134. if (fpamr == NULL)
  135. {
  136. fclose(fpwave);
  137. return 0;
  138. }
  139. /* write magic number to indicate single channel AMR file storage format */
  140. bytes = fwrite(AMR_MAGIC_NUMBER, sizeof(char), strlen(AMR_MAGIC_NUMBER), fpamr);
  141. /* skip to pcm audio data*/
  142. SkipToPCMAudioData(fpwave);
  143. enstate = Encoder_Interface_init(dtx);
  144. while(1)
  145. {
  146. // read one pcm frame
  147. if (!ReadPCMFrame(speech, fpwave, nChannels, nBitsPerSample)) break;
  148. frames++;
  149. /* call encoder */
  150. byte_counter = Encoder_Interface_Encode(enstate, req_mode, speech, amrFrame, 0);
  151. bytes += byte_counter;
  152. fwrite(amrFrame, sizeof (unsigned char), byte_counter, fpamr );
  153. }
  154. Encoder_Interface_exit(enstate);
  155. fclose(fpamr);
  156. fclose(fpwave);
  157. return frames;
  158. }
  159. #pragma mark - Decode
  160. //decode
  161. void WriteWAVEFileHeader(FILE* fpwave, int nFrame)
  162. {
  163. char tag[10] = "";
  164. // 1. 写RIFF头
  165. RIFFHEADER riff;
  166. strcpy(tag, "RIFF");
  167. memcpy(riff.chRiffID, tag, 4);
  168. riff.nRiffSize = 4 // WAVE
  169. + sizeof(XCHUNKHEADER) // fmt
  170. + sizeof(WAVEFORMATX) // WAVEFORMATX
  171. + sizeof(XCHUNKHEADER) // DATA
  172. + nFrame*160*sizeof(short); //
  173. strcpy(tag, "WAVE");
  174. memcpy(riff.chRiffFormat, tag, 4);
  175. fwrite(&riff, 1, sizeof(RIFFHEADER), fpwave);
  176. // 2. 写FMT块
  177. XCHUNKHEADER chunk;
  178. WAVEFORMATX wfx;
  179. strcpy(tag, "fmt ");
  180. memcpy(chunk.chChunkID, tag, 4);
  181. chunk.nChunkSize = sizeof(WAVEFORMATX);
  182. fwrite(&chunk, 1, sizeof(XCHUNKHEADER), fpwave);
  183. memset(&wfx, 0, sizeof(WAVEFORMATX));
  184. wfx.nFormatTag = 1;
  185. wfx.nChannels = 1; // 单声道
  186. wfx.nSamplesPerSec = 8000; // 8khz
  187. wfx.nAvgBytesPerSec = 16000;
  188. wfx.nBlockAlign = 2;
  189. wfx.nBitsPerSample = 16; // 16位
  190. fwrite(&wfx, 1, sizeof(WAVEFORMATX), fpwave);
  191. // 3. 写data块头
  192. strcpy(tag, "data");
  193. memcpy(chunk.chChunkID, tag, 4);
  194. chunk.nChunkSize = nFrame*160*sizeof(short);
  195. fwrite(&chunk, 1, sizeof(XCHUNKHEADER), fpwave);
  196. }
  197. const int myround(const double x)
  198. {
  199. return((int)(x+0.5));
  200. }
  201. // 根据帧头计算当前帧大小
  202. int caclAMRFrameSize(unsigned char frameHeader)
  203. {
  204. int mode;
  205. int temp1 = 0;
  206. int temp2 = 0;
  207. int frameSize;
  208. temp1 = frameHeader;
  209. // 编码方式编号 = 帧头的3-6位
  210. temp1 &= 0x78; // 0111-1000
  211. temp1 >>= 3;
  212. mode = amrEncodeMode[temp1];
  213. // 计算amr音频数据帧大小
  214. // 原理: amr 一帧对应20ms,那么一秒有50帧的音频数据
  215. temp2 = myround((double)(((double)mode / (double)AMR_FRAME_COUNT_PER_SECOND) / (double)8));
  216. frameSize = myround((double)temp2 + 0.5);
  217. return frameSize;
  218. }
  219. // 读第一个帧 - (参考帧)
  220. // 返回值: 0-出错; 1-正确
  221. int ReadAMRFrameFirst(FILE* fpamr, unsigned char frameBuffer[], int* stdFrameSize, unsigned char* stdFrameHeader)
  222. {
  223. memset(frameBuffer, 0, sizeof(frameBuffer));
  224. // 先读帧头
  225. fread(stdFrameHeader, 1, sizeof(unsigned char), fpamr);
  226. if (feof(fpamr)) return 0;
  227. // 根据帧头计算帧大小
  228. *stdFrameSize = caclAMRFrameSize(*stdFrameHeader);
  229. // 读首帧
  230. frameBuffer[0] = *stdFrameHeader;
  231. fread(&(frameBuffer[1]), 1, (*stdFrameSize-1)*sizeof(unsigned char), fpamr);
  232. if (feof(fpamr)) return 0;
  233. return 1;
  234. }
  235. // 返回值: 0-出错; 1-正确
  236. int ReadAMRFrame(FILE* fpamr, unsigned char frameBuffer[], int stdFrameSize, unsigned char stdFrameHeader)
  237. {
  238. int bytes = 0;
  239. unsigned char frameHeader; // 帧头
  240. memset(frameBuffer, 0, sizeof(frameBuffer));
  241. // 读帧头
  242. // 如果是坏帧(不是标准帧头),则继续读下一个字节,直到读到标准帧头
  243. while(1)
  244. {
  245. bytes = fread(&frameHeader, 1, sizeof(unsigned char), fpamr);
  246. if (feof(fpamr)) return 0;
  247. if (frameHeader == stdFrameHeader) break;
  248. }
  249. // 读该帧的语音数据(帧头已经读过)
  250. frameBuffer[0] = frameHeader;
  251. bytes = fread(&(frameBuffer[1]), 1, (stdFrameSize-1)*sizeof(unsigned char), fpamr);
  252. if (feof(fpamr)) return 0;
  253. return 1;
  254. }
  255. // 将AMR文件解码成WAVE文件
  256. int DecodeAMRFileToWAVEFile(const char* pchAMRFileName, const char* pchWAVEFilename)
  257. {
  258. FILE* fpamr = NULL;
  259. FILE* fpwave = NULL;
  260. char magic[8];
  261. void * destate;
  262. int nFrameCount = 0;
  263. int stdFrameSize;
  264. unsigned char stdFrameHeader;
  265. unsigned char amrFrame[MAX_AMR_FRAME_SIZE];
  266. short pcmFrame[PCM_FRAME_SIZE];
  267. // NSString * path = [[NSBundle mainBundle] pathForResource: @"test" ofType: @"amr"];
  268. // fpamr = fopen([path cStringUsingEncoding:NSASCIIStringEncoding], "rb");
  269. fpamr = fopen(pchAMRFileName, "rb");
  270. if ( fpamr==NULL ) return 0;
  271. // 检查amr文件头
  272. fread(magic, sizeof(char), strlen(AMR_MAGIC_NUMBER), fpamr);
  273. if (strncmp(magic, AMR_MAGIC_NUMBER, strlen(AMR_MAGIC_NUMBER)))
  274. {
  275. fclose(fpamr);
  276. return 0;
  277. }
  278. // 创建并初始化WAVE文件
  279. // NSArray *paths = NSSearchPathForDirectoriesInDomains(NSDocumentDirectory, NSUserDomainMask, YES);
  280. // NSString *documentPath = [paths objectAtIndex:0];
  281. // NSString *docFilePath = [documentPath stringByAppendingPathComponent:[NSString stringWithFormat:@"%s", pchWAVEFilename]];
  282. // NSLog(@"documentPath=%@", documentPath);
  283. //
  284. // fpwave = fopen([docFilePath cStringUsingEncoding:NSASCIIStringEncoding], "wb");
  285. fpwave = fopen(pchWAVEFilename,"wb");
  286. WriteWAVEFileHeader(fpwave, nFrameCount);
  287. /* init decoder */
  288. destate = Decoder_Interface_init();
  289. // 读第一帧 - 作为参考帧
  290. memset(amrFrame, 0, sizeof(amrFrame));
  291. memset(pcmFrame, 0, sizeof(pcmFrame));
  292. ReadAMRFrameFirst(fpamr, amrFrame, &stdFrameSize, &stdFrameHeader);
  293. // 解码一个AMR音频帧成PCM数据
  294. Decoder_Interface_Decode(destate, amrFrame, pcmFrame, 0);
  295. nFrameCount++;
  296. fwrite(pcmFrame, sizeof(short), PCM_FRAME_SIZE, fpwave);
  297. // 逐帧解码AMR并写到WAVE文件里
  298. while(1)
  299. {
  300. memset(amrFrame, 0, sizeof(amrFrame));
  301. memset(pcmFrame, 0, sizeof(pcmFrame));
  302. if (!ReadAMRFrame(fpamr, amrFrame, stdFrameSize, stdFrameHeader)) break;
  303. // 解码一个AMR音频帧成PCM数据 (8k-16b-单声道)
  304. Decoder_Interface_Decode(destate, amrFrame, pcmFrame, 0);
  305. nFrameCount++;
  306. fwrite(pcmFrame, sizeof(short), PCM_FRAME_SIZE, fpwave);
  307. }
  308. // NSLog(@"frame = %d", nFrameCount);
  309. Decoder_Interface_exit(destate);
  310. fclose(fpwave);
  311. // 重写WAVE文件头
  312. // fpwave = fopen([docFilePath cStringUsingEncoding:NSASCIIStringEncoding], "r+");
  313. fpwave = fopen(pchWAVEFilename, "r+");
  314. WriteWAVEFileHeader(fpwave, nFrameCount);
  315. fclose(fpwave);
  316. return nFrameCount;
  317. }