audio_session.cpp 31 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270370470570670770870971071171271371471571671771871972072172272372472572672772872973073173273373473573673773873974074174274374474574674774874975075175275375475575675775875976076176276376476576676776876977077177277377477577677777877978078178278378478578678778878979079179279379479579679779879980080180280380480580680780880981081181281381481581681781881982082182282382482582682782882983083183283383483583683783883984084184284384484584684784884985085185285385485585685785885986086186286386486586686786886987087187287387487587687787887988088188288388488588688788888989089189289389489589689789889990090190290390490590690790890991091191291391491591691791891992092192292392492592692792892993093193293393493593693793893994094194294394494594694794894995095195295395495595695795895996096196296396496596696796896997097197297397497597697797897998098198298398498598698798898999099199299399499599699799899910001001100210031004100510061007100810091010
  1. #include "stdafx.h"
  2. #include "SpBase.h"
  3. #include "audio_session.h"
  4. #include <memutil.h>
  5. #include <rtp.h>
  6. #include <rtpsession.h>
  7. #include <audioframework.h>
  8. #include <portaudio.h>
  9. #include "libaudioqueue.h"
  10. #include "rvc_media_common.h"
  11. #define AUDIO_CLOCK 8000
  12. #define AUDIO_SHM_FRAME_TIME 20 // 20ms
  13. #ifndef RVC_MAX_BUFFER_LEN
  14. #define RVC_MAX_BUFFER_LEN 1024
  15. #endif
  16. #ifndef RVC_AUDIO_FRAME_LEN
  17. #define RVC_AUDIO_FRAME_LEN 320
  18. #endif
  19. char straudiodata[RVC_MAX_BUFFER_LEN] = {0};
  20. int iIndex = 0;
  21. int iLastLeft = 0;
  22. static int g_nAudioRecvNum = 0;
  23. static int g_nAudioSendNum = 0;
  24. enum e_media_dir
  25. {
  26. DIR_NONE = 0,
  27. DIR_TX = 1,
  28. DIR_RX = 2,
  29. DIR_BOTH = 3,
  30. };
  31. typedef struct audio_recorder_t audio_recorder_t;
  32. typedef struct audio_phonemedia_t audio_phonemedia_t;
  33. struct audio_session_t
  34. {
  35. audio_session_conf_t conf;
  36. audio_session_phonemedia_conf_t phonemedia_conf;
  37. audio_session_t *owner;
  38. apr_pool_t *pool;
  39. audioengine_t *engine;
  40. audiocontext_t *context;
  41. audiobridge_t *bridge;
  42. apr_pool_t *micspk_pool;
  43. audiomicspk2_t *micspkstream;
  44. audiodsp_t *dspstream;
  45. audioresize_t *resizestream;
  46. audiortp_t *rtpstream;
  47. audiocodec_t *codecstream;
  48. rtp_session_t *rtpsess;
  49. Clibaudioqueue*remoteaudioqueue;
  50. bool brtpinsertqueue;
  51. bool baudiorecved;
  52. };
  53. static int on_rx_audio(char *frame,void*userdata)
  54. {
  55. audio_session_t*session = (audio_session_t*)userdata;
  56. int used = 0;
  57. if (DOUBLERECORD_CALLTYPE != session->phonemedia_conf.eCalltype)
  58. {
  59. if (frame)
  60. {
  61. audio_frame frm;
  62. frm.bitspersample = 16;
  63. frm.format = 1;
  64. frm.data = frame;
  65. frm.framesize = 160; //注意此参数可能不准确,网络传输的包大小可能是不定长的,取音频数据时慎用此参数
  66. //写入实际的单个包大小
  67. //frm.framesize = strlen(frame); //不能使用此方法,网络传输的包大小可能是不定长的
  68. frm.nchannels = 1;
  69. frm.samplespersec = 8000;
  70. if (!session->remoteaudioqueue->InsertAudio(&frm))
  71. {
  72. DbgWithLink(LOG_LEVEL_INFO, LOG_TYPE_SYSTEM)("InsertAudio failed! frameCount:%d", frm.framesize);
  73. used = -1;
  74. }
  75. }
  76. }
  77. return used;
  78. }
  79. static void m_on_send_hook(const char *buf, int size, void *arg)
  80. {
  81. g_nAudioSendNum++;
  82. }
  83. static bool phonemedia_rtp_record(audio_session_t* pseesion)
  84. {
  85. bool bret = false;
  86. if (NULL == pseesion){
  87. return bret;
  88. }
  89. if (true == pseesion->brtpinsertqueue){
  90. if (DOUBLERECORD_CALLTYPE == pseesion->phonemedia_conf.eCalltype){
  91. if (eStand2sType == pseesion->phonemedia_conf.eDeviceType){
  92. if (DEV_PICKUP == pseesion->phonemedia_conf.dev_type){
  93. bret = true;
  94. }
  95. }
  96. }
  97. }
  98. return bret;
  99. }
  100. static void m_on_recv_hook(const char *buf, int size, void *arg)
  101. {
  102. rtp_hdr *hdr = (rtp_hdr*)buf;
  103. audio_session_t* psession = (audio_session_t*)arg;
  104. if (false == psession->baudiorecved){
  105. //char strmsg[MAX_PATH] = { 0 };
  106. //_snprintf(strmsg, MAX_PATH, "received first audio packet, and packet size is %d, rtp port (%d <-----> %d).", size, psession->phonemedia_conf.local_rtp_port, psession->phonemedia_conf.remote_rtp_port);
  107. //LogWarn(Severity_Low, Error_Debug, EVENT_MOD_SIP_AUDIO_STREAM_RECEIVED, strmsg);
  108. //DbgWithLink(LOG_LEVEL_INFO, LOG_TYPE_SYSTEM)(strmsg);
  109. psession->baudiorecved = true;
  110. }
  111. if ((g_nAudioRecvNum%100) == 0){
  112. //DbgWithLink(LOG_LEVEL_INFO, LOG_TYPE_SYSTEM)("recv audio pkt num %d, single size %d",g_nAudioRecvNum,size);
  113. //if (psession->phonemedia_conf.eDeviceType == eStand2sType){
  114. //DbgWithLink(LOG_LEVEL_INFO, LOG_TYPE_SYSTEM)("current hand free flag is %d, call type = %d, pt = %d,arg addr is 0x%08x.",(int)psession->phonemedia_conf.dev_type, psession->phonemedia_conf.eCalltype, hdr->pt, arg);
  115. //}
  116. }
  117. if (0 == psession->phonemedia_conf.dev_type && DOUBLERECORD_CALLTYPE == psession->phonemedia_conf.eCalltype){
  118. if (false == psession->brtpinsertqueue){
  119. DbgWithLink(LOG_LEVEL_INFO, LOG_TYPE_SYSTEM)("rtp stream insert to audio queue flag is set to true.");
  120. }
  121. psession->brtpinsertqueue = true;
  122. }
  123. g_nAudioRecvNum++;
  124. if (true == phonemedia_rtp_record(psession)){
  125. char strbuffer[RVC_MAX_BUFFER_LEN]={0};
  126. int outsize = RVC_MAX_BUFFER_LEN;
  127. switch(hdr->pt)
  128. {
  129. case RTP_PT_PCMA:
  130. audiocodec_pcma_decode(buf+sizeof(rtp_hdr), size-sizeof(rtp_hdr), strbuffer, &outsize);
  131. break;
  132. case RTP_PT_PCMU:
  133. audiocodec_pcmu_decode(buf+sizeof(rtp_hdr), size-sizeof(rtp_hdr), strbuffer, &outsize);
  134. break;
  135. case RTP_PT_G729:
  136. audiocodec_g729a_decode(buf+sizeof(rtp_hdr), size-sizeof(rtp_hdr), strbuffer, &outsize);
  137. break;
  138. default:
  139. DbgWithLink(LOG_LEVEL_INFO, LOG_TYPE_SYSTEM)("audiocodec_decode not support audio pt(%d).", hdr->pt);
  140. break;
  141. }
  142. if (psession && psession->remoteaudioqueue){
  143. int iCount = (outsize+iLastLeft)/RVC_AUDIO_FRAME_LEN;
  144. memcpy(straudiodata+iLastLeft, strbuffer, iCount*RVC_AUDIO_FRAME_LEN-iLastLeft);
  145. for(int i = 0; i < iCount; i++)
  146. {
  147. audio_frame frm;
  148. char straudio[RVC_AUDIO_FRAME_LEN]={0};
  149. memcpy(straudio, straudiodata+i*RVC_AUDIO_FRAME_LEN, RVC_AUDIO_FRAME_LEN);
  150. frm.bitspersample = 16;
  151. frm.format = 1;
  152. frm.data = straudio;
  153. frm.framesize = RVC_AUDIO_FRAME_LEN; //注意此参数可能不准确,网络传输的包大小可能是不定长的,取音频数据时慎用此参数
  154. frm.nchannels = 1;
  155. frm.samplespersec = 8000;
  156. if (!psession->remoteaudioqueue->InsertAudio(&frm))
  157. {
  158. DbgWithLink(LOG_LEVEL_INFO, LOG_TYPE_SYSTEM)("InsertAudio failed! frameCount:%d", frm.framesize);
  159. }
  160. }
  161. memset(straudiodata, 0, RVC_MAX_BUFFER_LEN); //清空缓存
  162. iLastLeft = (outsize + iLastLeft) % RVC_AUDIO_FRAME_LEN; //上次剩余不足RVC_AUDIO_FRAME_LEN的buffer
  163. if ((0 != iLastLeft) && (iCount*RVC_AUDIO_FRAME_LEN < outsize)){
  164. memcpy(straudiodata, strbuffer+iCount*RVC_AUDIO_FRAME_LEN, iLastLeft); //暂存上一次的未入队列的音频数据
  165. }
  166. }
  167. else{
  168. DbgWithLink(LOG_LEVEL_INFO, LOG_TYPE_SYSTEM)("pseesion->remoteaudioqueue is null.");
  169. }
  170. }
  171. }
  172. static void audio_device_event(int bopen, int iret, int bmicro, int idev, const char* strmessage, void* user_data)
  173. {
  174. char strinfo[MAX_PATH] = { 0 };
  175. DWORD errorcode = 0;
  176. if (bopen){
  177. if (DEV_PICKUP == idev) {
  178. char strpickup[] = "[pickup]";
  179. _snprintf(strinfo, MAX_PATH, "%s%s", strmessage, strpickup);
  180. if (0 == iret) {
  181. if (bmicro) {
  182. errorcode = EVENT_MOD_SIP_PICKUP_IN_AUDIO_DEVICE_OPEN_SUCCESS;
  183. }
  184. else {
  185. errorcode = EVENT_MOD_SIP_PICKUP_OUT_AUDIO_DEVICE_OPEN_SUCCESS;
  186. }
  187. }
  188. else {
  189. if (bmicro) {
  190. errorcode = EVENT_MOD_SIP_PICKUP_IN_AUDIO_DEVICE_OPEN_FAILED;
  191. }
  192. else {
  193. errorcode = EVENT_MOD_SIP_PICKUP_OUT_AUDIO_DEVICE_OPEN_FAILED;
  194. }
  195. }
  196. }
  197. else {
  198. char strhandfree[] = "[hand free]";
  199. _snprintf(strinfo, MAX_PATH, "%s%s", strmessage, strhandfree);
  200. if (0 == iret) {
  201. if (bmicro) {
  202. errorcode = EVENT_MOD_SIP_HANDFREE_IN_AUDIO_DEVICE_OPEN_SUCCESS;
  203. }
  204. else {
  205. errorcode = EVENT_MOD_SIP_HANDFREE_OUT_AUDIO_DEVICE_OPEN_SUCCESS;
  206. }
  207. }
  208. else {
  209. if (bmicro) {
  210. errorcode = EVENT_MOD_SIP_HANDFREE_IN_AUDIO_DEVICE_OPEN_FAILED;
  211. }
  212. else {
  213. errorcode = EVENT_MOD_SIP_HANDFREE_OUT_AUDIO_DEVICE_OPEN_FAILED;
  214. }
  215. }
  216. }
  217. }
  218. else {
  219. if (DEV_PICKUP == idev) {
  220. char strpickup[] = "[pickup]";
  221. _snprintf(strinfo, MAX_PATH, "%s%s", strmessage, strpickup);
  222. if (bmicro) {
  223. errorcode = EVENT_MOD_SIP_PICKUP_IN_AUDIO_DEVICE_CLOSE;
  224. }
  225. else {
  226. errorcode = EVENT_MOD_SIP_PICKUP_OUT_AUDIO_DEVICE_CLOSE;
  227. }
  228. }
  229. else {
  230. char strhandfree[] = "[hand free]";
  231. _snprintf(strinfo, MAX_PATH, "%s%s", strmessage, strhandfree);
  232. if (bmicro) {
  233. errorcode = EVENT_MOD_SIP_HANDFREE_IN_AUDIO_DEVICE_CLOSE;
  234. }
  235. else {
  236. errorcode = EVENT_MOD_SIP_HANDFREE_OUT_AUDIO_DEVICE_CLOSE;
  237. }
  238. }
  239. }
  240. LogWarn(Severity_Low, Error_Debug, errorcode, strinfo);
  241. }
  242. static void m_on_recv_hook_backup(const char *buf, int size, void *arg)
  243. {
  244. rtp_hdr *hdr = (rtp_hdr*)buf;
  245. audio_session_t* pseesion = (audio_session_t*)arg;
  246. g_nAudioRecvNum++;
  247. //if ((g_nAudioRecvNum%60) == 0)
  248. //{
  249. // DbgWithLink(LOG_LEVEL_INFO, LOG_TYPE_SYSTEM)("recv audio pkt num %d,single size %d",g_nAudioRecvNum,size);
  250. // DbgWithLink(LOG_LEVEL_INFO, LOG_TYPE_SYSTEM)("pt = %d,arg addr is 0x%08x.",hdr->pt, arg);
  251. //}
  252. if (g_nAudioRecvNum % 2)
  253. {
  254. memset(straudiodata, 0, RVC_MAX_BUFFER_LEN);
  255. memcpy(straudiodata, buf+sizeof(rtp_hdr), size-sizeof(rtp_hdr));
  256. iIndex = (size-sizeof(rtp_hdr));
  257. }
  258. else
  259. {
  260. memcpy(straudiodata+iIndex, buf+sizeof(rtp_hdr), size-sizeof(rtp_hdr));
  261. iIndex = 0;
  262. char strbuffer[RVC_MAX_BUFFER_LEN]={0};
  263. int outsize = RVC_MAX_BUFFER_LEN;
  264. switch(hdr->pt)
  265. {
  266. case RTP_PT_PCMA:
  267. audiocodec_pcma_decode(straudiodata, 2*(size-sizeof(rtp_hdr)), strbuffer, &outsize);
  268. break;
  269. case RTP_PT_PCMU:
  270. audiocodec_pcmu_decode(straudiodata, 2*(size-sizeof(rtp_hdr)), strbuffer, &outsize);
  271. break;
  272. case RTP_PT_G729:
  273. audiocodec_g729a_decode(straudiodata, 2*(size-sizeof(rtp_hdr)), strbuffer, &outsize);
  274. break;
  275. default:
  276. DbgWithLink(LOG_LEVEL_INFO, LOG_TYPE_SYSTEM)("audiocodec_decode not support audio pt(%d).", hdr->pt);
  277. break;
  278. }
  279. if (pseesion && pseesion->remoteaudioqueue){
  280. int iCount = outsize/320;
  281. for(int i = 0; i < iCount; i++)
  282. {
  283. audio_frame frm;
  284. char straudio[320]={0};
  285. memcpy(straudio, strbuffer+i*320, 320);
  286. frm.bitspersample = 16;
  287. frm.format = 1;
  288. frm.data = straudio;
  289. frm.framesize = 320; //注意此参数可能不准确,网络传输的包大小可能是不定长的,取音频数据时慎用此参数
  290. ////写入实际的单个包大小
  291. //frm.framesize = strlen(frame); //不能使用此方法,网络传输的包大小可能是不定长的
  292. frm.nchannels = 1;
  293. frm.samplespersec = 8000;
  294. if (!pseesion->remoteaudioqueue->InsertAudio(&frm))
  295. {
  296. DbgWithLink(LOG_LEVEL_INFO, LOG_TYPE_SYSTEM)("InsertAudio failed! frameCount:%d", frm.framesize);
  297. }
  298. }
  299. }
  300. else{
  301. DbgWithLink(LOG_LEVEL_INFO, LOG_TYPE_SYSTEM)("pseesion->remoteaudioqueue is null.");
  302. }
  303. }
  304. }
  305. //static int translate_id(int in_direction, int idx);
  306. static int phonemedia_stop(audio_session_t *session, int b_record_turn_off);
  307. static void phonemedia_reconfig(audio_session_t *media, const audio_session_phonemedia_conf_t *conf)
  308. {
  309. memcpy(&media->phonemedia_conf, conf, sizeof(audio_session_phonemedia_conf_t));
  310. }
  311. static int phonemedia_start(audio_session_t *session)
  312. {
  313. audio_session_t *media = session;
  314. audio_session_phonemedia_conf_t *conf = &media->phonemedia_conf;
  315. apr_status_t status;
  316. int rc;
  317. int opt_micspk;
  318. const char *in_dev;
  319. const char *out_dev;
  320. int in_agc;
  321. int out_agc;
  322. int in_ns;
  323. int out_ns;
  324. int aec;
  325. const char *codec;
  326. int istoptype;
  327. in_dev = &session->conf.in_dev[conf->dev_type][0];
  328. out_dev = &session->conf.out_dev[conf->dev_type][0];
  329. istoptype = media->conf.istoptype;
  330. opt_micspk = AMS_OPT_AS_STREAM;
  331. if (conf->dir & DIR_TX) {
  332. opt_micspk |= AMS_OPT_PLAY;
  333. }
  334. if (conf->dir &DIR_RX) {
  335. opt_micspk |= AMS_OPT_RECORD;
  336. }
  337. in_agc = media->conf.agc_in[conf->dev_type];
  338. out_agc = media->conf.agc_out[conf->dev_type];
  339. in_ns = media->conf.ns_in[conf->dev_type];
  340. out_ns = media->conf.ns_out[conf->dev_type];
  341. aec = media->conf.aec[conf->dev_type];
  342. switch (conf->local_pt) {
  343. case 0:
  344. codec = "PCMU";
  345. if (conf->local_ptime == 0)
  346. conf->local_ptime = 20;
  347. if (conf->remote_ptime == 0)
  348. conf->remote_ptime = 20;
  349. break;
  350. #if 0
  351. case 4:
  352. codec = "G723";
  353. if (conf->local_ptime == 0)
  354. conf->local_ptime = 30;
  355. if (conf->remote_ptime == 0)
  356. conf->remote_ptime = 30;
  357. break;
  358. #endif
  359. case 8:
  360. codec = "PCMA";
  361. if (conf->local_ptime == 0)
  362. conf->local_ptime = 20;
  363. if (conf->remote_ptime == 0)
  364. conf->remote_ptime = 20;
  365. break;
  366. case 18:
  367. codec = "G729";
  368. if (conf->local_ptime == 0)
  369. conf->local_ptime = 20;
  370. if (conf->remote_ptime == 0)
  371. conf->remote_ptime = 20;
  372. break;
  373. default:
  374. codec = NULL;
  375. break;
  376. }
  377. if (codec == NULL)
  378. goto on_error;
  379. //assert(conf->local_ptime == conf->remote_ptime);
  380. if (conf->local_ptime != conf->remote_ptime) {
  381. conf->local_ptime = conf->remote_ptime;
  382. }
  383. status = apr_pool_create(&media->pool, NULL);
  384. if (status != APR_SUCCESS) {
  385. LogWarn(Severity_Middle, Error_Debug, ERROR_MOD_SIP_APR_POOL_CREATE_FAILED, "create media pool failed!");
  386. return Error_Resource;
  387. }
  388. status = audioengine_create(media->pool, &media->engine);
  389. if (status != APR_SUCCESS) {
  390. LogWarn(Severity_Middle, Error_Debug, ERROR_MOD_SIP_AUDIO_ENGINE_CREATE_FAILED, "create audio engine failed!");
  391. goto on_error;
  392. }
  393. status = audioengine_start(media->engine);
  394. if (status != APR_SUCCESS) {
  395. LogWarn(Severity_Middle, Error_Debug, ERROR_MOD_SIP_AUDIO_ENGINE_START_FAILED, "audio engine start failed!");
  396. goto on_error;
  397. }
  398. rc = rtp_session_create2(conf->local_rtp_ip, conf->local_rtp_port,
  399. 2, &media->rtpsess);
  400. if (rc != 0) {
  401. LogWarn(Severity_Middle, Error_Debug, ERROR_MOD_SIP_AUDIO_RTP_SESSION_CREATE_FAILED, CSimpleStringA::Format("audio rtp session create2 failed and local port is %d, rc=%d", conf->local_rtp_port, rc).GetData());
  402. //LogWarn(Severity_Middle, Error_Debug, EVENT_MOD_SIP_AUDIO_RTP_CREATE, strmsg);
  403. goto on_error;
  404. }
  405. //rc = rtp_session_reset2(media->rtpsess, conf->dir|RTP_SESSION_FLAG_NO_RTCP, conf->remote_rtp_ip, conf->remote_rtp_port, conf->remote_rtp_port+1);
  406. rc = rtp_session_reset2(media->rtpsess, conf->dir, conf->remote_rtp_ip, conf->remote_rtp_port, conf->remote_rtp_port+1);
  407. if (rc != 0) {
  408. LogWarn(Severity_Middle, Error_Debug, ERROR_MOD_SIP_AUDIO_RTP_SESSION_RESET_FAILED, "audio rtp session reset failed!");
  409. goto on_error;
  410. }
  411. status = audiobridge_create(media->pool, media->engine, &media->bridge);
  412. if (status != APR_SUCCESS){
  413. LogWarn(Severity_Middle, Error_Debug, ERROR_MOD_SIP_AUDIO_BRIDGE_CREATE_FAILED, "audio bridge create failed!");
  414. goto on_error;
  415. }
  416. status = apr_pool_create(&media->micspk_pool, media->pool);
  417. if (status != APR_SUCCESS){
  418. LogWarn(Severity_Middle, Error_Debug, ERROR_MOD_SIP_APR_POOL_CREATE_FAILED, "create media micspk_pool failed!");
  419. goto on_error;
  420. }
  421. if (in_agc)
  422. opt_micspk |= AMS2_OPT_AGC;
  423. if (in_ns)
  424. opt_micspk |= AMS2_OPT_NS;
  425. if (aec)
  426. opt_micspk |= AMS2_OPT_AEC;
  427. //create Spk
  428. status = audiomicspk2_create(media->micspk_pool, media->engine, opt_micspk, AUDIO_CLOCK, in_dev, out_dev, istoptype, conf->dev_type, &audio_device_event, &media->micspkstream);
  429. if (status != APR_SUCCESS){
  430. LogWarn(Severity_Middle, Error_Debug, ERROR_MOD_SIP_AUDIO_MICSPK2_CREATE_FAILED, "create audio micspk2(windows) failed!");
  431. goto on_error;
  432. }
  433. //音频回调
  434. media->micspkstream->user_data = media;
  435. media->micspkstream->on_rx_audio = &on_rx_audio;
  436. //status = audiomicspk3_create(media->micspk_pool, media->engine, opt_micspk, AUDIO_CLOCK, in_dev, out_dev, &media->micspkstream);
  437. if (out_agc || out_ns) {
  438. int read_opt = AUDIO_DSP_NONE;
  439. int write_opt = AUDIO_DSP_NONE;
  440. if (out_agc)
  441. write_opt |= AUDIO_DSP_AGC;
  442. if (out_ns)
  443. write_opt |= AUDIO_DSP_DENOISE;
  444. status = audiodsp_create(media->micspk_pool, media->engine, read_opt, write_opt, AUDIO_CLOCK, &media->dspstream);
  445. if (status != APR_SUCCESS){
  446. LogWarn(Severity_Middle, Error_Debug, ERROR_MOD_SIP_AUDIO_DSP_CREATE_FAILED, "create audio dsp failed!");
  447. goto on_error;
  448. }
  449. }
  450. #if 0
  451. status = audioaec_create(media->pool, media->engine, AUDIO_CLOCK, FRAME_TIME,
  452. AUDIO_AEC_OPT_READ_AS_CAPTURE, &media->aecstream);
  453. if (status != APR_SUCCESS)
  454. goto on_error;
  455. #endif
  456. status = audioresize_create(media->pool, media->engine, FRAME_TIME*2*AUDIO_CLOCK/1000,
  457. conf->remote_ptime*2*AUDIO_CLOCK/1000, FRAME_TIME*2*AUDIO_CLOCK/1000,
  458. conf->local_ptime*2*AUDIO_CLOCK/1000, &media->resizestream);
  459. if (status != APR_SUCCESS){
  460. LogWarn(Severity_Middle, Error_Debug, ERROR_MOD_SIP_AUDIO_RESIZE_CREATE_FAILED, "create audio resize failed!");
  461. goto on_error;
  462. }
  463. status = audiocodec_create(media->pool, media->engine, codec, AUDIO_CLOCK, FRAME_TIME,
  464. AUDIO_CODEC_OPT_ENCODE_WRITE, &media->codecstream);
  465. if (status != APR_SUCCESS){
  466. LogWarn(Severity_Middle, Error_Debug, ERROR_MOD_SIP_AUDIO_CODEC_CREATE_FAILED, "create audio codec failed!");
  467. goto on_error;
  468. }
  469. status = audiortp_create(media->pool, media->engine, media->rtpsess, &media->rtpstream);
  470. if (status != APR_SUCCESS){
  471. LogWarn(Severity_Middle, Error_Debug, ERROR_MOD_SIP_AUDIO_RTP_CREATE_FAILED, "create audio rtp failed!");
  472. goto on_error;
  473. }
  474. g_nAudioRecvNum = 0;
  475. g_nAudioSendNum = 0;
  476. {
  477. int param;
  478. param = AUDIO_CLOCK;
  479. audiortp_set_param(media->rtpstream, AUDIO_RTP_FLAG_SEND_CLOCK, &param);
  480. audiortp_set_param(media->rtpstream, AUDIO_RTP_FLAG_RECV_CLOCK, &param);
  481. param = conf->local_pt;
  482. audiortp_set_param(media->rtpstream, AUDIO_RTP_FLAG_SEND_PT, &param);
  483. param = conf->remote_pt;
  484. audiortp_set_param(media->rtpstream, AUDIO_RTP_FLAG_RECV_PT, &param);
  485. param = conf->local_dtmf_pt;
  486. audiortp_set_param(media->rtpstream, AUDIO_RTP_FLAG_SEND_DTMF, &param);
  487. param = conf->remote_dtmf_pt;
  488. audiortp_set_param(media->rtpstream, AUDIO_RTP_FLAG_RECV_DTMF, &param);
  489. param = conf->local_ptime;
  490. audiortp_set_param(media->rtpstream, AUDIO_RTP_FLAG_SEND_PTIME, &param);
  491. param = conf->remote_ptime;
  492. audiortp_set_param(media->rtpstream, AUDIO_RTP_FLAG_RECV_PTIME, &param);
  493. //media->rtpstream->m_on_send_hook = &m_on_recv_hook;
  494. //DbgWithLink(LOG_LEVEL_INFO, LOG_TYPE_SYSTEM)("recv hook addr %d,send hook addr %d", &m_on_recv_hook,&m_on_send_hook);
  495. audiortp_set_param(media->rtpstream, AUDIO_RTP_FLAG_HOOK_ARG, media);
  496. //DbgWithLink(LOG_LEVEL_INFO, LOG_TYPE_SYSTEM)("AUDIO_RTP_FLAG_HOOK_ARG addr is 0x%08x.", media);
  497. audiortp_set_param(media->rtpstream, AUDIO_RTP_FLAG_RECV_HOOK, &m_on_recv_hook);
  498. audiortp_set_param(media->rtpstream, AUDIO_RTP_FLAG_SEND_HOOK, &m_on_send_hook);
  499. //audiortp_set_param(media->rtpstream, AUDIO_RTP_FLAG_HOOK_ARG, media->rtpstream);
  500. audiortp_init(media->rtpstream);
  501. }
  502. if (conf->dir == DIR_TX)
  503. {
  504. if (media->dspstream)
  505. {
  506. audiostream_connect_pipeline(STREAM_DIR_READ, &media->micspkstream->base, &media->dspstream->base, NULL);
  507. }
  508. else
  509. {
  510. audiostream_connect_pipeline(STREAM_DIR_READ, &media->micspkstream->base, NULL);
  511. }
  512. audiobridge_set_leg(media->bridge, AUDIO_BRIDGE_LEG_LEFT, &media->micspkstream->base);
  513. audiostream_connect_pipeline(STREAM_DIR_WRITE, &media->resizestream->base, &media->codecstream->base, &media->rtpstream->base, NULL);
  514. audiobridge_set_leg(media->bridge, AUDIO_BRIDGE_LEG_RIGHT, &media->resizestream->base);
  515. }
  516. else if (conf->dir == DIR_RX)
  517. {
  518. if (media->dspstream)
  519. {
  520. audiostream_connect_pipeline(STREAM_DIR_WRITE, &media->micspkstream->base, &media->dspstream->base, NULL);
  521. }
  522. else
  523. {
  524. audiostream_connect_pipeline(STREAM_DIR_WRITE, &media->micspkstream->base, NULL);
  525. }
  526. audiostream_connect_pipeline(STREAM_DIR_READ, &media->resizestream->base, &media->codecstream->base, &media->rtpstream->base, NULL);
  527. audiobridge_set_leg(media->bridge, AUDIO_BRIDGE_LEG_LEFT, &media->micspkstream->base);
  528. audiobridge_set_leg(media->bridge, AUDIO_BRIDGE_LEG_RIGHT, &media->resizestream->base);
  529. }
  530. else
  531. {
  532. if (media->dspstream)
  533. {
  534. audiostream_connect_pipeline(STREAM_DIR_BOTH, &media->micspkstream->base, &media->dspstream->base, NULL);
  535. }
  536. else
  537. {
  538. audiostream_connect_pipeline(STREAM_DIR_BOTH, &media->micspkstream->base, NULL);
  539. }
  540. audiobridge_set_leg(media->bridge, AUDIO_BRIDGE_LEG_LEFT, &media->micspkstream->base);
  541. audiostream_connect_pipeline(STREAM_DIR_BOTH, &media->resizestream->base, &media->codecstream->base, &media->rtpstream->base, NULL);
  542. audiobridge_set_leg(media->bridge, AUDIO_BRIDGE_LEG_RIGHT, &media->resizestream->base);
  543. }
  544. status = audiocontext_create(media->pool, media->engine, &media->context);
  545. if (status != APR_SUCCESS){
  546. LogWarn(Severity_Middle, Error_Debug, ERROR_MOD_SIP_AUDIO_CONTEXT_CREATE_FAILED, "create audio context failed!");
  547. goto on_error;
  548. }
  549. audiocontext_add_driver(media->context, &media->bridge->base);
  550. audioengine_start_context(media->engine, media->context);
  551. return 0;
  552. on_error:
  553. phonemedia_stop(media, TRUE);
  554. DbgWithLink(LOG_LEVEL_INFO, LOG_TYPE_SYSTEM)("phonemedia_stop error!!!");
  555. return Error_Resource;
  556. }
  557. static int phonemedia_stop(audio_session_t *session, int b_record_turn_off)
  558. {
  559. audio_session_t *media = session;
  560. if (media->context) {
  561. audioengine_stop_context(media->engine, media->context);
  562. audiocontext_remove_driver(media->context, &media->bridge->base);
  563. audiocontext_destroy(media->context);
  564. media->context = NULL;
  565. }
  566. if (media->engine) {
  567. audioengine_stop(media->engine);
  568. audioengine_destroy(media->engine);
  569. media->engine = NULL;
  570. }
  571. if (media->bridge) {
  572. audiobridge_destroy(media->bridge);
  573. media->bridge = NULL;
  574. }
  575. if (media->resizestream) {
  576. audioresize_destroy(media->resizestream);
  577. media->resizestream = NULL;
  578. }
  579. if (media->codecstream) {
  580. audiocodec_destroy(media->codecstream);
  581. media->codecstream = NULL;
  582. }
  583. if (media->rtpstream) {
  584. audiortp_destroy(media->rtpstream);
  585. media->rtpstream = NULL;
  586. }
  587. if (media->rtpsess) {
  588. unsigned short ilocal_port = 0;
  589. rtp_session_get_local_rtp_port(media->rtpsess, &ilocal_port);
  590. rtp_session_destroy(media->rtpsess);
  591. {
  592. LogWarn(Severity_Low, Error_Debug, EVENT_MOD_SIP_AUDIO_RTP_DESTROY, CSimpleStringA::Format("audio rtp(media->rtpsess) destroy and local port is %u.", ilocal_port).GetData());
  593. }
  594. media->rtpsess = NULL;
  595. }
  596. if (media->dspstream) {
  597. audiodsp_destroy(media->dspstream);
  598. media->dspstream = NULL;
  599. }
  600. if (media->micspkstream) {
  601. audiomicspk2_destroy(media->micspkstream);
  602. media->micspkstream = NULL;
  603. apr_pool_destroy(media->micspk_pool);
  604. media->micspk_pool = NULL;
  605. }
  606. if (media->pool) {
  607. apr_pool_destroy(media->pool);
  608. media->pool = NULL;
  609. }
  610. return 0;
  611. }
  612. static int phonemedia_chang_dev(audio_session_t *session, e_dev_type t)
  613. {
  614. audio_session_t *media = session;
  615. audio_session_phonemedia_conf_t *conf = &media->phonemedia_conf;
  616. int opt_micspk;
  617. const char *in_dev;
  618. const char *out_dev;
  619. int in_agc;
  620. int out_agc;
  621. int in_ns;
  622. int out_ns;
  623. int aec;
  624. int istoptype;
  625. in_dev = &session->conf.in_dev[t][0];
  626. out_dev = &session->conf.out_dev[t][0];
  627. in_agc = media->conf.agc_in[t];
  628. out_agc = media->conf.agc_out[t];
  629. in_ns = media->conf.ns_in[t];
  630. out_ns = media->conf.ns_out[t];
  631. aec = media->conf.aec[t];
  632. istoptype = media->conf.istoptype;
  633. opt_micspk = AMS_OPT_AS_STREAM;
  634. if (conf->dir & DIR_TX) {
  635. opt_micspk |= AMS_OPT_PLAY;
  636. }
  637. if (conf->dir & DIR_RX) {
  638. opt_micspk |= AMS_OPT_RECORD;
  639. }
  640. if (media->pool) {
  641. //apr_status_t status;
  642. audiocontext_remove_driver(media->context, &media->bridge->base);
  643. if (media->micspkstream) {
  644. audiomicspk2_destroy(media->micspkstream);
  645. media->micspkstream = NULL;
  646. }
  647. if (media->dspstream) {
  648. audiodsp_destroy(media->dspstream);
  649. media->dspstream = NULL;
  650. }
  651. apr_pool_destroy(media->micspk_pool);
  652. apr_pool_create(&media->micspk_pool, media->pool);
  653. if (in_agc)
  654. opt_micspk |= AMS2_OPT_AGC;
  655. if (in_ns)
  656. opt_micspk |= AMS2_OPT_NS;
  657. if (aec)
  658. opt_micspk |= AMS2_OPT_AEC;
  659. audiomicspk2_create(media->micspk_pool, media->engine, opt_micspk, AUDIO_CLOCK, in_dev, out_dev, istoptype, t, &audio_device_event, &media->micspkstream);
  660. media->micspkstream->on_rx_audio = &on_rx_audio;
  661. media->phonemedia_conf.dev_type = t;
  662. if (out_agc || out_ns) {
  663. int read_opt = AUDIO_DSP_NONE;
  664. int write_opt = AUDIO_DSP_NONE;
  665. if (out_agc)
  666. write_opt |= AUDIO_DSP_AGC;
  667. if (out_ns)
  668. write_opt |= AUDIO_DSP_DENOISE;
  669. audiodsp_create(media->micspk_pool, media->engine, read_opt, write_opt, AUDIO_CLOCK, &media->dspstream);
  670. }
  671. if (conf->dir == DIR_TX) {
  672. if (media->dspstream) {
  673. audiostream_connect_pipeline(STREAM_DIR_READ, &media->micspkstream->base, &media->dspstream->base, NULL);
  674. } else {
  675. audiostream_connect_pipeline(STREAM_DIR_READ, &media->micspkstream->base, NULL);
  676. }
  677. audiobridge_set_leg(media->bridge, AUDIO_BRIDGE_LEG_LEFT, &media->micspkstream->base);
  678. audiostream_connect_pipeline(STREAM_DIR_WRITE, &media->resizestream->base, &media->codecstream->base, &media->rtpstream->base, NULL);
  679. audiobridge_set_leg(media->bridge, AUDIO_BRIDGE_LEG_RIGHT, &media->resizestream->base);
  680. } else if (conf->dir == DIR_RX) {
  681. if (media->dspstream) {
  682. audiostream_connect_pipeline(STREAM_DIR_WRITE, &media->micspkstream->base, &media->dspstream->base, NULL);
  683. } else {
  684. audiostream_connect_pipeline(STREAM_DIR_WRITE, &media->micspkstream->base, NULL);
  685. }
  686. audiostream_connect_pipeline(STREAM_DIR_READ, &media->resizestream->base, &media->codecstream->base, &media->rtpstream->base, NULL);
  687. audiobridge_set_leg(media->bridge, AUDIO_BRIDGE_LEG_LEFT, &media->micspkstream->base);
  688. audiobridge_set_leg(media->bridge, AUDIO_BRIDGE_LEG_RIGHT, &media->resizestream->base);
  689. } else {
  690. if (media->dspstream) {
  691. audiostream_connect_pipeline(STREAM_DIR_BOTH, &media->micspkstream->base, &media->dspstream->base, NULL);
  692. } else {
  693. audiostream_connect_pipeline(STREAM_DIR_BOTH, &media->micspkstream->base, NULL);
  694. }
  695. audiobridge_set_leg(media->bridge, AUDIO_BRIDGE_LEG_LEFT, &media->micspkstream->base);
  696. audiostream_connect_pipeline(STREAM_DIR_BOTH, &media->resizestream->base, &media->codecstream->base, &media->rtpstream->base, NULL);
  697. audiobridge_set_leg(media->bridge, AUDIO_BRIDGE_LEG_RIGHT, &media->resizestream->base);
  698. }
  699. audiortp_reset_jitter(media->rtpstream);
  700. audiocontext_add_driver(media->context, &media->bridge->base);
  701. return 0;
  702. } else {
  703. return Error_NotInit;
  704. }
  705. return Error_Unexpect;
  706. }
  707. ///////////////////////////////////////////////////////////////////////////////////////////////////////////////////////
  708. //// audio session
  709. int audio_session_create(const audio_session_conf_t *conf, audio_session_t **p_session)
  710. {
  711. audio_session_t *session = ZALLOC_T(audio_session_t);
  712. session->remoteaudioqueue = new Clibaudioqueue(REC_COMMON_REMOTEAUDIO_SHM_QUEUE);
  713. session->brtpinsertqueue = false;
  714. session->baudiorecved = false;
  715. if (session) {
  716. memcpy(&session->conf, conf, sizeof(audio_session_conf_t));
  717. *p_session = session;
  718. return 0;
  719. } else {
  720. return Error_Resource;
  721. }
  722. }
  723. int audio_session_start_phonemedia(audio_session_t *session, const audio_session_phonemedia_conf_t *conf)
  724. {
  725. int rc;
  726. if (!session)
  727. return Error_NotInit;
  728. if (session->pool) { // already started
  729. phonemedia_stop(session, FALSE);
  730. }
  731. phonemedia_reconfig(session, conf);
  732. rc = phonemedia_start(session);
  733. return rc;
  734. }
  735. int audio_session_change_dev(audio_session_t *session, e_dev_type t)
  736. {
  737. return phonemedia_chang_dev(session, t);
  738. }
  739. int audio_session_stop(audio_session_t *session)
  740. {
  741. return phonemedia_stop(session, TRUE);
  742. }
  743. void audio_session_destroy(audio_session_t *session)
  744. {
  745. if (session->remoteaudioqueue)
  746. {
  747. delete session->remoteaudioqueue;
  748. }
  749. assert(session->pool == NULL);
  750. free(session);
  751. }
  752. ///////////////////////////////////////////////////////////////////////////////////////////////////////////////////////
  753. static void __stdcall __audio_log_func(int level, const char *s)
  754. {
  755. DbgWithLink(LOG_LEVEL_INFO, LOG_TYPE_SYSTEM)(s);
  756. }
  757. //static char* utf8togb2312(const char* utf8)
  758. //{
  759. // int len = MultiByteToWideChar(CP_UTF8, 0, utf8, -1, NULL, 0);
  760. //
  761. // wchar_t* wstr = new wchar_t[len + 1];
  762. // memset(wstr, 0, (len + 1)*sizeof(wchar_t));
  763. //
  764. // MultiByteToWideChar(CP_UTF8, 0, utf8, -1, wstr, len);
  765. // len = WideCharToMultiByte(CP_ACP, 0, wstr, -1, NULL, 0, NULL, NULL);
  766. //
  767. // char* str = new char[len + 1];
  768. // memset(str, 0, (len + 1)*sizeof(char));
  769. //
  770. // WideCharToMultiByte(CP_ACP, 0, wstr, -1, str, len, NULL, NULL);
  771. //
  772. // if (wstr) {
  773. // delete[]wstr;
  774. // wstr = NULL;
  775. // }
  776. // return str;
  777. //}
  778. //
  779. //
  780. //static char* gb2312toutf8(const char* gb2312)
  781. //{
  782. // int len = MultiByteToWideChar(CP_ACP, 0, gb2312, -1, NULL, 0);
  783. // wchar_t* wstr = new wchar_t[len + 1];
  784. // memset(wstr, 0, (len + 1)*sizeof(wchar_t));
  785. //
  786. // MultiByteToWideChar(CP_ACP, 0, gb2312, -1, wstr, len);
  787. // len = WideCharToMultiByte(CP_UTF8, 0, wstr, -1, NULL, 0, NULL, NULL);
  788. //
  789. // char* str = new char[len + 1];
  790. // memset(str, 0, (len + 1)*sizeof(char));
  791. // WideCharToMultiByte(CP_UTF8, 0, wstr, -1, str, len, NULL, NULL);
  792. // if (wstr) {
  793. // delete[] wstr;
  794. // wstr = NULL;
  795. // }
  796. // return str;
  797. //}
  798. int audio_lib_init()
  799. {
  800. audio_log_set_func(&__audio_log_func);
  801. int rc = audioframework_init();
  802. if (rc != 0) {
  803. return Error_Resource;
  804. } else {
  805. int icnt, ocnt;
  806. audio_log_set_func(NULL);
  807. rc = audio_get_dev_count(&icnt, &ocnt);
  808. if (rc == 0) {
  809. int i;
  810. CSimpleStringA strJsonIn;
  811. DbgWithLink(LOG_LEVEL_INFO, LOG_TYPE_SYSTEM)("audio input devices(%d):", icnt);
  812. for (i = 0; i < icnt; ++i) {
  813. CSimpleStringA str = audio_get_dev_name(true, i);
  814. DbgWithLink(LOG_LEVEL_INFO, LOG_TYPE_SYSTEM)("%d = %s", i, str.GetData());
  815. strJsonIn += CSimpleStringA::Format("\"%d\":\"%s\",", i, str.GetData());
  816. }
  817. if (strJsonIn.GetLength() > 0) {
  818. strJsonIn[strJsonIn.GetLength() - 1] = '\0';
  819. }
  820. CSimpleStringA strJsonInData = CSimpleStringA::Format("audio in devices [{%s}]", strJsonIn.GetData());
  821. LogWarn(Severity_Low, Error_Debug, LOG_EVT_SIPPHONE_GET_AUDIO_IN_INFOS, strJsonInData.GetData());
  822. CSimpleStringA strJsonOut;
  823. DbgWithLink(LOG_LEVEL_INFO, LOG_TYPE_SYSTEM)("audio output devices(%d):", ocnt);
  824. for (i = 0; i < ocnt; ++i) {
  825. CSimpleStringA str = audio_get_dev_name(false, i);
  826. DbgWithLink(LOG_LEVEL_INFO, LOG_TYPE_SYSTEM)("%d = %s", i, str.GetData());
  827. strJsonOut += CSimpleStringA::Format("\"%d\":\"%s\",", i, str.GetData());
  828. }
  829. if (strJsonOut.GetLength() > 0) {
  830. strJsonOut[strJsonOut.GetLength() - 1] = '\0';
  831. }
  832. CSimpleStringA strJsonOutData = CSimpleStringA::Format("audio out devices [{%s}]", strJsonOut.GetData());
  833. LogWarn(Severity_Low, Error_Debug, LOG_EVT_SIPPHONE_GET_AUDIO_OUT_INFOS, strJsonOutData.GetData());
  834. }
  835. audio_log_set_func(&__audio_log_func);
  836. }
  837. return 0;
  838. }
  839. void audio_lib_deinit()
  840. {
  841. audioframework_term();
  842. }
  843. int audio_get_dev_count(int *in_cnt, int *out_cnt)
  844. {
  845. int icnt = 0, ocnt = 0;
  846. int cnt = Pa_GetDeviceCount();
  847. for (int i = 0; i < cnt; ++i) {
  848. const PaDeviceInfo *info = Pa_GetDeviceInfo(i);
  849. if (info->maxInputChannels)
  850. icnt ++;
  851. if (info->maxOutputChannels)
  852. ocnt ++;
  853. }
  854. if (in_cnt)
  855. *in_cnt = icnt;
  856. if (out_cnt)
  857. *out_cnt = ocnt;
  858. return 0;
  859. }
  860. CSimpleStringA audio_get_dev_name(bool in_direction, int idx)
  861. {
  862. audio_log_set_func(NULL);
  863. int cnt = Pa_GetDeviceCount();
  864. int ii, i;
  865. for (i = 0, ii = 0; i < cnt; ++i) {
  866. const PaDeviceInfo *info = Pa_GetDeviceInfo(i);
  867. if (in_direction) {
  868. if (info->maxInputChannels) {
  869. if (idx == ii) {
  870. CSimpleStringA strInDevice = CSimpleStringA(info->name);
  871. return strInDevice;
  872. }
  873. ii++;
  874. }
  875. } else {
  876. if (info->maxOutputChannels) {
  877. if (idx == ii) {
  878. CSimpleStringA strOutDevice = CSimpleStringA(info->name);
  879. return strOutDevice;
  880. }
  881. ii++;
  882. }
  883. }
  884. }
  885. return CSimpleStringA();
  886. }
  887. int capture_get_audio_device_id(bool in_direction, const char *dev_name)
  888. {
  889. if (NULL == dev_name) {
  890. return -1;
  891. }
  892. int cnt = Pa_GetDeviceCount();
  893. int ii, i;
  894. for (i = 0, ii = 0; i < cnt; ++i) {
  895. const PaDeviceInfo *info = Pa_GetDeviceInfo(i);
  896. if (in_direction) {
  897. if (info->maxInputChannels) {
  898. if (strstr(info->name, dev_name) != NULL) {
  899. return ii;
  900. }
  901. ii++;
  902. }
  903. }
  904. else {
  905. if (info->maxOutputChannels) {
  906. if (strstr(info->name, dev_name) != NULL) {
  907. return ii;
  908. }
  909. ii++;
  910. }
  911. }
  912. }
  913. return -1;
  914. }