Leaked source code of windows server 2003
You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

844 lines
31 KiB

  1. #include <stdio.h>
  2. #include <stdlib.h>
  3. #include "sdstruct.h"
  4. #include "sdstuff.h"
  5. #include "tabl_ns.h"
  6. #include <math.h>
  7. /**************************************************************
  8. ***************************************************************
  9. ***************************************************************
  10. ***************************************************************
  11. Silence Detection subroutines
  12. Mark R. Walker, 5/95
  13. Copyright Intel Inc., 1995
  14. ***************************************************************
  15. ***************************************************************
  16. ***************************************************************/
  17. /************************************************************************************************/
  18. /************************************************************************************************/
  19. /******* get_params ************/
  20. /************************************************************************************************/
  21. /************************************************************************************************/
  22. /* This subroutine computes the parameters used by the classifier to determine
  23. whether the current frame is silent*/
  24. #if PLOTFILE
  25. void getParams(INSTNCE *SD_inst, float *inbuff, int buffersize, float *p1, float *p2, float *p3)
  26. #else
  27. void getParams(INSTNCE *SD_inst, float *inbuff, int buffersize)
  28. #endif
  29. {
  30. int M, p, i, q, offset, index;
  31. float *buffptr,R[12];
  32. float gamma, delta, L[50], E[12];
  33. float alpha0;
  34. float Energy;
  35. float epsilon = 0.00001f;
  36. M = 6;
  37. buffptr = inbuff;
  38. offset = M;
  39. for(i=0; i<(M-1)*(M-1); i++) L[i] = 0.0f;
  40. Energy = DotProdSD(buffptr, buffptr, buffersize)/buffersize;
  41. /* Compute autocorrelation coeffs. */
  42. for(q=0; q<=M; q++) R[q] = DotProdSD(buffptr, buffptr+q, buffersize-q);
  43. for(i=0; i<=M; i++) R[i] = Binomial80[i]*R[i];
  44. /* Compute first linear predictor */
  45. L[0] = 1.0f;
  46. E[0] = R[0];
  47. /* Forward Levinson's recursion */
  48. for(p=1;p<=M;p++)
  49. {
  50. for(delta=0.0f, i=0;i<p;i++) delta += R[i+1]*L[(p-1)*offset + i];
  51. if (E[p-1]!=0.0) gamma = delta / E[p-1];
  52. else gamma = epsilon;
  53. L[p*offset+0] = -gamma;
  54. for(i=1;i<p;i++) L[p*offset + i] = L[(p-1)*offset + i-1] - gamma*L[(p-1)*offset + p-1-i];
  55. L[p*offset + p] = 1.0f;
  56. E[p] = E[p-1] * (1.0f-gamma*gamma);
  57. }
  58. alpha0 = -L[33];
  59. /* Load the calculated parameters into the SD data structure */
  60. /* Zero crossings */
  61. SD_inst->SDstate.FrameZCs = (float) zeroCross(inbuff, buffersize)/buffersize;
  62. /* Frame energy */
  63. if(Energy!=0.0f)
  64. SD_inst->SDstate.FrameEnergy = (float)(20.0f*log10(Energy));
  65. else {
  66. index = (SD_inst->SDFlags & MASK_SQUELCH) >> 8;
  67. SD_inst->SDstate.FrameEnergy = Squelch[index] - 9.0f
  68. + SD_inst->SDstate.SDsettings.Energy_on
  69. + SD_inst->SDstate.Mode0Ptr->Energy.Stdev;
  70. }
  71. /* First linear predictor */
  72. SD_inst->SDstate.FrameLinPred = 100.0f*alpha0;
  73. #if PLOTFILE
  74. *p1 = SD_inst->SDstate.FrameZCs;
  75. *p2 = SD_inst->SDstate.FrameEnergy;
  76. *p3 = SD_inst->SDstate.FrameLinPred;
  77. #endif
  78. //end
  79. }
  80. /************************************************************************************************/
  81. /************************************************************************************************/
  82. /******* glblSDinitialize ************/
  83. /************************************************************************************************/
  84. /************************************************************************************************/
  85. /* This routine is called once per session for setting global values needed for silence */
  86. /* detection. */
  87. /************************************************************************************************/
  88. /************************************************************************************************/
  89. void glblSDinitialize(INSTNCE *SD_inst)
  90. {
  91. int i, index, histSize, tauHistSize;
  92. float squelch_level;
  93. /* Set the mode pointers pointing to the mode structures - initially */
  94. SD_inst->SDstate.Mode0Ptr = &(SD_inst->SDstate.Mode0);
  95. SD_inst->SDstate.Mode1Ptr = &(SD_inst->SDstate.Mode1);
  96. /* set history sizes based on buffersize, passed in from minifilter shell*/
  97. SD_inst->SDstate.SDsettings.BufferSize = BUFFERSIZE;
  98. histSize = SD_inst->SDstate.SDsettings.HistSize = HIST_SIZE;
  99. tauHistSize = SD_inst->SDstate.SDsettings.TauHistSize = ENERGY_TAU_HIST_SIZE;
  100. SD_inst->SDstate.SDsettings.MinStartupCount = (int)(MIN_STARTUP_TIME*8000.0/BUFFERSIZE);
  101. SD_inst->SDstate.SDsettings.MaxStartupCount = (int)(MAX_STARTUP_TIME*8000.0/BUFFERSIZE);
  102. SD_inst->SDstate.SDsettings.MaxSpeechFrameCount = (int)(MAX_SPEECH_TIME*8000.0/BUFFERSIZE);
  103. /* set silent/sound frame designation initially to silent */
  104. /* Class = 1, silent frame
  105. Class = 0, non-silent */
  106. SD_inst->SDstate.Class = 1;
  107. /*set silence detetction initally disabled */
  108. /* SD_enable =0, silence detection disabled - SD_initialize executes
  109. SD_enable =1, silence detection enabled */
  110. SD_inst->SDstate.SD_enable = 0;
  111. /* The flags should be set in the minifilter audio format */
  112. //SD_inst->SDFlags = 0;
  113. //SD_inst->SDFlags |= MASK_SD_ENABLE; /* set enable bit by default */
  114. /*The energy squelch level is acquired by unmasking some of
  115. the bits in SDFlags */
  116. index = (SD_inst->SDFlags & MASK_SQUELCH) >> 8;
  117. squelch_level = Squelch[index];
  118. SD_inst->SDstate.SDsettings.Squelch_set = squelch_level;
  119. /*
  120. *Tau distributions initial values. Tau is is the distance between the mean silent energy (mode 0),
  121. and the mean speech energy (mode 1). It is only used in SD_initialize.
  122. */
  123. /*TauStdev is used in SD_initialize to decide when to quit initializing*/
  124. SD_inst->SDstate.TauMode.TauEnergy.TauStdev = (float)INITL_STOPPING_STDEV;
  125. /*Minimum acceptable Tau value used in SD_initialize to decide if silence detection is possible*/
  126. SD_inst->SDstate.SDsettings.Energy_MinTau = (float)INITL_MIN_TAU;
  127. for (i=0;i<tauHistSize;i++) SD_inst->SDstate.TauMode.TauEnergy.TauHistory[i] = 0.0f;
  128. /*Mode 0 & 1 distribution initial values. Mode 0 is the statistical information for silence.
  129. Mode 1 is the statistical information for speech */
  130. for (i=0;i<histSize;i++)
  131. {
  132. SD_inst->SDstate.Mode1Ptr->Energy.History[i] = 0.0f;
  133. SD_inst->SDstate.Mode0Ptr->Energy.History[i] = 0.0f;
  134. SD_inst->SDstate.Mode0Ptr->Alpha1.History[i] = 0.0f;
  135. SD_inst->SDstate.Mode0Ptr->ZC.History[i] = 0.0f;
  136. }
  137. /*set initial frame counts*/
  138. /*initFrameCount is only used to count frames in SD_initialize
  139. The Mode 0 and Mode 1 counters count continuous runs of
  140. silent and non-silent frames, resepctively.
  141. They are used in both SD_initialize and the main GSM encoder loop */
  142. SD_inst->SDstate.initFrameCount = 0;
  143. SD_inst->SDstate.Mode0Ptr->FrameCount=0;
  144. SD_inst->SDstate.Mode1Ptr->FrameCount=0;
  145. /*Mode 1 (speech) initial values*/
  146. SD_inst->SDstate.Mode1Ptr->Energy.Mean = squelch_level + 10.0f;
  147. SD_inst->SDstate.Mode1Ptr->Energy.Stdev = 1.0f;
  148. /*Mode 0 (silence) initial values*/
  149. SD_inst->SDstate.Mode0Ptr->Energy.Mean = squelch_level - 10.0f;
  150. SD_inst->SDstate.Mode0Ptr->Energy.Stdev = 1.0f;
  151. SD_inst->SDstate.Mode0Ptr->Alpha1.Mean = 0.0f;
  152. SD_inst->SDstate.Mode0Ptr->Alpha1.Stdev = 0.0f;
  153. SD_inst->SDstate.Mode0Ptr->ZC.Mean = 0.0f;
  154. SD_inst->SDstate.Mode0Ptr->ZC.Stdev = 0.0f;
  155. /* class = 0 = speech frame = "off"
  156. /* class = 1 = silent frame = "on"
  157. /*"On" thresholds used by silence_detect and SD_initialize.
  158. These values either multiply or are added to the standard
  159. deviation of each of the three stat types.
  160. Making these values smaller makes the range of values
  161. smaller, and thus makes the transition from speech
  162. frame designation (Class=0) to silent frame designation (Class=1)
  163. less likely */
  164. SD_inst->SDstate.SDsettings.Energy_on =INITL_ENERGY_ON;
  165. SD_inst->SDstate.SDsettings.ZC_on =INITL_ZC_ON;
  166. SD_inst->SDstate.SDsettings.Alpha1_on =INITL_ALPHA_ON;
  167. SD_inst->SDstate.HangCntr = 0;
  168. /*"Off" thresholds used by silence_detect.
  169. These values either multiply or are added to the standard
  170. deviation of each of the three stat types.
  171. Making these values smaller makes the transition from silent
  172. frame designation (Class=1) to speech frame designation (Class=0)
  173. harder, less likely */
  174. SD_inst->SDstate.SDsettings.Energy_off =INITL_ENERGY_OFF;
  175. SD_inst->SDstate.SDsettings.ZC_off =INITL_ZC_OFF;
  176. SD_inst->SDstate.SDsettings.Alpha1_off =INITL_ALPHA_OFF;
  177. /* Initialize circular buffers for prefiltering operations */
  178. for(i=0;i<4;i++) SD_inst->SDstate.Filt.nBuffer[i]=0.0f;
  179. for(i=0;i<3;i++) SD_inst->SDstate.Filt.dBuffer[i]=0.0f;
  180. for(i=0;i<6;i++){
  181. SD_inst->SDstate.Filt.denom[i]=0.0f;
  182. SD_inst->SDstate.Filt.num[i]=0.0f;
  183. }
  184. }/*End global initalize SD*/
  185. /***********************************************************************************************/
  186. /************************************************************************************************/
  187. /******* silenceDetect ************/
  188. /************************************************************************************************/
  189. /************************************************************************************************/
  190. /* Mark R. Walker
  191. Copyright Intel inc., 1995*/
  192. /* Silence_Detect is executed once per frame if silence detection is enabled.
  193. It employs three vocoder parameters (energy, zero crossings, first predictor)
  194. to determine if a given frame is speech or background silence.
  195. It returns the resulting frame classification. */
  196. /************************************************************************************************/
  197. /************************************************************************************************/
  198. int silenceDetect(INSTNCE *SD_inst, float Energy_tx, float ZC_tx)
  199. {
  200. int histSize, adaptEnable, i, Class;
  201. float Alpha1_val, Energy_val, Zc_count;
  202. /* set history sizes based on buffersize, passed in from minifilter shell*/
  203. histSize = SD_inst->SDstate.SDsettings.HistSize;
  204. /*
  205. * -------state switch decision criteria -------
  206. *
  207. * Class = 1, frame is silent
  208. * Class = 0, frame is non-silent
  209. */
  210. adaptEnable = TRUE;
  211. Alpha1_val = SD_inst->SDstate.FrameLinPred;
  212. Energy_val = SD_inst->SDstate.FrameEnergy;
  213. Zc_count = SD_inst->SDstate.FrameZCs;
  214. if (Energy_val <= SD_inst->SDstate.Mode0Ptr->Energy.Mean)
  215. /* if current frame Energy_val <= mode0 energy mean, this is definitely a silent frame*/
  216. {
  217. /* In this case, do no further testing of the frame class */
  218. SD_inst->SDstate.Class = SILENCE;
  219. /* If the current frame energy is too low, this frame may be an
  220. outlier with respect to the silence statistics. Test and
  221. do not allow adaptation if this is true.
  222. */
  223. if(Energy_val < (SD_inst->SDstate.Mode0Ptr->Energy.Mean - 2.0*(SD_inst->SDstate.Mode0Ptr->Energy.Stdev)))
  224. adaptEnable = FALSE;
  225. }
  226. else /* else test the frame class */
  227. {
  228. SD_inst->SDstate.Class = classify(Energy_val,Alpha1_val,Zc_count,
  229. SD_inst->SDstate.Mode0Ptr->Energy.Mean, SD_inst->SDstate.Mode0Ptr->Energy.Stdev,
  230. SD_inst->SDstate.Mode0Ptr->Alpha1.Mean, SD_inst->SDstate.Mode0Ptr->Alpha1.Stdev,
  231. SD_inst->SDstate.Mode0Ptr->ZC.Mean, SD_inst->SDstate.Mode0Ptr->ZC.Stdev,
  232. SD_inst->SDstate.Class,
  233. Energy_tx, ZC_tx, SD_inst);
  234. }
  235. /* ------- update statistics-------
  236. *
  237. * if frame class is silent, update silence stats only
  238. */
  239. if ((SD_inst->SDstate.Class!=SPEECH) && (SD_inst->SDstate.Class!=NONADAPT) && (adaptEnable==TRUE))
  240. {
  241. /* ------- update history arrays-------
  242. */
  243. for(i=histSize-1; i>=1; i--)
  244. {
  245. SD_inst->SDstate.Mode0Ptr->Alpha1.History[i] = SD_inst->SDstate.Mode0Ptr->Alpha1.History[i-1];
  246. SD_inst->SDstate.Mode0Ptr->Energy.History[i] = SD_inst->SDstate.Mode0Ptr->Energy.History[i-1];
  247. SD_inst->SDstate.Mode0Ptr->ZC.History[i] = SD_inst->SDstate.Mode0Ptr->ZC.History[i-1];
  248. }
  249. /* ------- first linear predictor -------
  250. */
  251. SD_inst->SDstate.Mode0Ptr->Alpha1.History[0] = Alpha1_val;
  252. update(SD_inst->SDstate.Mode0Ptr->Alpha1.History,histSize,
  253. &(SD_inst->SDstate.Mode0Ptr->Alpha1.Mean),
  254. &(SD_inst->SDstate.Mode0Ptr->Alpha1.Stdev));
  255. /* ------- energy -------
  256. */
  257. SD_inst->SDstate.Mode0Ptr->Energy.History[0] = Energy_val;
  258. update(SD_inst->SDstate.Mode0Ptr->Energy.History,histSize,
  259. &(SD_inst->SDstate.Mode0Ptr->Energy.Mean),
  260. &(SD_inst->SDstate.Mode0Ptr->Energy.Stdev));
  261. /* ------- zero crossing -------
  262. */
  263. SD_inst->SDstate.Mode0Ptr->ZC.History[0] = Zc_count;
  264. update(SD_inst->SDstate.Mode0Ptr->ZC.History,histSize,
  265. &(SD_inst->SDstate.Mode0Ptr->ZC.Mean),
  266. &(SD_inst->SDstate.Mode0Ptr->ZC.Stdev));
  267. }
  268. if(SD_inst->SDstate.Class == NONADAPT)
  269. Class = SILENCE;
  270. else Class = SD_inst->SDstate.Class;
  271. return(Class); /*return frame classification*/
  272. } /*end silenceDetect*/
  273. /************************************************************************************************/
  274. /************************************************************************************************/
  275. /******* initializeSD ************/
  276. /************************************************************************************************/
  277. /************************************************************************************************/
  278. /* Mark R. Walker
  279. Copyright Intel inc., 1995*/
  280. /* initializeSD is executed once per frame prior to the enabling of silence detection.
  281. It employs three vocoder parameters (energy, zero crossings, first predictor)
  282. to determine if a given frame is speech or background silence.
  283. The first part simply fills all of the Mode 0 history arrays and the Mode 1
  284. energy history arrays with values.
  285. The second part of SD_Initialize can take no less than MIN_STARTUP frames, and no more than
  286. MAX_STARTUP frames.
  287. Initalization ends when the standard deviation of the distance between the Mode 0 mean
  288. (silence) and the Mode 1 mean (speech) drops below STOPPING_STDEV.
  289. When the second part of the subroutine has completed, two tests are performed before silence
  290. detection is enabled. First, the distance between the Mode 0 and Mode 1 energy means must be
  291. greater than or equal to Energy_MinTau. Second, the energy "on" threshold must be less
  292. than the energy squelch level. */
  293. /************************************************************************************************/
  294. /************************************************************************************************/
  295. /*-------------------------------------------------------------------------------------------------------------------
  296. */
  297. int initializeSD(INSTNCE *SD_inst)
  298. {
  299. int SD_enable, i, j;
  300. int mode1HistSize, mode0HistSize;
  301. int bufferSize, histSize, tauHistSize, minFrameCount, maxFrameCount;
  302. float Energy_tau, squelch_level;
  303. float Alpha1_val, Energy_val, Zc_count;
  304. STATS TempPtr;
  305. SD_inst->SDstate.initFrameCount++;
  306. Alpha1_val = SD_inst->SDstate.FrameLinPred;
  307. Energy_val = SD_inst->SDstate.FrameEnergy;
  308. Zc_count = SD_inst->SDstate.FrameZCs;
  309. /* set local values of history size */
  310. bufferSize = SD_inst->SDstate.SDsettings.BufferSize;
  311. histSize = SD_inst->SDstate.SDsettings.HistSize;
  312. /* set local values of min and max frame count */
  313. minFrameCount = SD_inst->SDstate.SDsettings.MinStartupCount;
  314. maxFrameCount = SD_inst->SDstate.SDsettings.MaxStartupCount;
  315. /*First part of SD_Initialize simply fills the history arrays with values */
  316. if(SD_inst->SDstate.initFrameCount < SD_inst->SDstate.SDsettings.TauHistSize)
  317. { tauHistSize = SD_inst->SDstate.initFrameCount;
  318. }
  319. else
  320. { tauHistSize = SD_inst->SDstate.SDsettings.TauHistSize;
  321. }
  322. if (((SD_inst->SDstate.TauMode.TauEnergy.TauStdev > STOPPING_STDEV) || (SD_inst->SDstate.initFrameCount <= minFrameCount)) && (SD_inst->SDstate.initFrameCount <= maxFrameCount))
  323. {
  324. /*-----Select Energy mode decision--------*/
  325. if ((Energy_val < SD_inst->SDstate.Mode0Ptr->Energy.Mean) || (fabs(Energy_val - SD_inst->SDstate.Mode0Ptr->Energy.Mean) < (SD_inst->SDstate.SDsettings.Energy_on + SD_inst->SDstate.Mode0Ptr->Energy.Stdev)))
  326. { /*Energy mode = Mode0 (silence)*/
  327. /*increment mode zero frame counter*/
  328. SD_inst->SDstate.Mode0Ptr->FrameCount++;
  329. if(SD_inst->SDstate.Mode0Ptr->FrameCount < histSize)
  330. { mode0HistSize = SD_inst->SDstate.Mode0Ptr->FrameCount;
  331. }
  332. else
  333. { mode0HistSize = histSize;
  334. }
  335. /*update the history arrays*/
  336. for (i=mode0HistSize-1; i>=1; i--)
  337. {
  338. SD_inst->SDstate.Mode0Ptr->Alpha1.History[i] = SD_inst->SDstate.Mode0Ptr->Alpha1.History[i-1];
  339. SD_inst->SDstate.Mode0Ptr->Energy.History[i] = SD_inst->SDstate.Mode0Ptr->Energy.History[i-1];
  340. SD_inst->SDstate.Mode0Ptr->ZC.History[i] = SD_inst->SDstate.Mode0Ptr->ZC.History[i-1];
  341. }
  342. /*load new frame values into history arrays and update statistics */
  343. SD_inst->SDstate.Mode0Ptr->Energy.History[0] = Energy_val;
  344. update(SD_inst->SDstate.Mode0Ptr->Energy.History,mode0HistSize,&(SD_inst->SDstate.Mode0Ptr->Energy.Mean),&(SD_inst->SDstate.Mode0Ptr->Energy.Stdev));
  345. SD_inst->SDstate.Mode0Ptr->Alpha1.History[0] = Alpha1_val;
  346. update(SD_inst->SDstate.Mode0Ptr->Alpha1.History,mode0HistSize,&(SD_inst->SDstate.Mode0Ptr->Alpha1.Mean),&(SD_inst->SDstate.Mode0Ptr->Alpha1.Stdev));
  347. SD_inst->SDstate.Mode0Ptr->ZC.History[0] = Zc_count;
  348. update(SD_inst->SDstate.Mode0Ptr->ZC.History,mode0HistSize,&(SD_inst->SDstate.Mode0Ptr->ZC.Mean),&(SD_inst->SDstate.Mode0Ptr->ZC.Stdev));
  349. }
  350. else /*Energy mode = 1 (speech) - Update Mode1 energy statistics only*/
  351. {
  352. /*increment mode 1 frame counter*/
  353. SD_inst->SDstate.Mode1Ptr->FrameCount++;
  354. if(SD_inst->SDstate.Mode1Ptr->FrameCount < histSize)
  355. { mode1HistSize = SD_inst->SDstate.Mode1Ptr->FrameCount;
  356. }
  357. else
  358. { mode1HistSize = histSize;
  359. }
  360. /*update the history array*/
  361. for (i=mode1HistSize-1; i>=1; i--) SD_inst->SDstate.Mode1Ptr->Energy.History[i] = SD_inst->SDstate.Mode1Ptr->Energy.History[i-1];
  362. /*load new frame values into history arrays and update statistics */
  363. SD_inst->SDstate.Mode1Ptr->Energy.History[0]= Energy_val;
  364. update(SD_inst->SDstate.Mode1Ptr->Energy.History,mode1HistSize,&(SD_inst->SDstate.Mode1Ptr->Energy.Mean),&(SD_inst->SDstate.Mode1Ptr->Energy.Stdev));
  365. }
  366. /* ---------------------- Compute Tau -------------------------------- */
  367. /* Tau is the difference between the Mode0 and Mode1 mean energy values */
  368. Energy_tau = (float)fabs(SD_inst->SDstate.Mode0Ptr->Energy.Mean - SD_inst->SDstate.Mode1Ptr->Energy.Mean);
  369. /* ---------------------- Update Tau history -------------------------- */
  370. for (i=tauHistSize-1; i>=1; i--) SD_inst->SDstate.TauMode.TauEnergy.TauHistory[i] = SD_inst->SDstate.TauMode.TauEnergy.TauHistory[i-1];
  371. SD_inst->SDstate.TauMode.TauEnergy.TauHistory[0]= Energy_tau;
  372. update(SD_inst->SDstate.TauMode.TauEnergy.TauHistory,tauHistSize,&(SD_inst->SDstate.TauMode.TauEnergy.TauMean),&(SD_inst->SDstate.TauMode.TauEnergy.TauStdev));
  373. /* Now check the energy means.*/
  374. /* The mode with the lowest mean energy is always set to Mode0 (silence)*/
  375. if((SD_inst->SDstate.Mode1Ptr->Energy.Mean) < (SD_inst->SDstate.Mode0Ptr->Energy.Mean))
  376. {
  377. TempPtr = SD_inst->SDstate.Mode0Ptr->Energy;
  378. SD_inst->SDstate.Mode0Ptr->Energy = SD_inst->SDstate.Mode1Ptr->Energy;
  379. SD_inst->SDstate.Mode1Ptr->Energy = TempPtr;
  380. }
  381. /* We are still initializing - silence detection is disabled */
  382. SD_enable = FALSE;
  383. } /* if TauEnergy.TauStdev > STOPPING_STDEV */
  384. else
  385. {
  386. /* At this point, either Tau stdev has dropped below STOPPING_STDEV, or
  387. we have exceeded MAX_STARTUP */
  388. /* Now decide whether silence / sound discrimination is possible */
  389. /* Get the squelch level from the data structure */
  390. squelch_level = SD_inst->SDstate.SDsettings.Squelch_set;
  391. /* Disable silence detection if TauEnergy.TauMean is less than Energy_MinTau */
  392. /* Disable also if we have never seen a silent frame (Mode0) */
  393. /* Disable also if the difference between the silence energy mean and the squelch level */
  394. /* is less than the "Energy_on" threshold */
  395. if(
  396. ( SD_inst->SDstate.TauMode.TauEnergy.TauMean < SD_inst->SDstate.SDsettings.Energy_MinTau) ||
  397. ( SD_inst->SDstate.Mode0Ptr->FrameCount == 0) ||
  398. ( SD_inst->SDstate.Mode1Ptr->Energy.Mean == squelch_level + 10) ||//This is the initial value
  399. ( fabs((SD_inst->SDstate.Mode0Ptr->Energy.Mean) - squelch_level)
  400. < (SD_inst->SDstate.SDsettings.Energy_on * SD_inst->SDstate.Mode0Ptr->Energy.Stdev))
  401. )
  402. {
  403. SD_enable = FALSE;
  404. }
  405. else
  406. {
  407. SD_enable = TRUE;
  408. }
  409. /* If the Mode0 history arrays are not filled - fill them out by repeating the last value */
  410. if((SD_inst->SDstate.Mode0Ptr->FrameCount !=0) && (SD_inst->SDstate.Mode0Ptr->FrameCount < histSize))
  411. {
  412. j=SD_inst->SDstate.Mode0Ptr->FrameCount;
  413. for(i=j; i<histSize; i++) SD_inst->SDstate.Mode0Ptr->Energy.History[i] = SD_inst->SDstate.Mode0Ptr->Energy.History[j-1];
  414. for(i=j; i<histSize; i++) SD_inst->SDstate.Mode0Ptr->Alpha1.History[i] = SD_inst->SDstate.Mode0Ptr->Alpha1.History[j-1];
  415. for(i=j; i<histSize; i++) SD_inst->SDstate.Mode0Ptr->ZC.History[i] = SD_inst->SDstate.Mode0Ptr->ZC.History[j-1];
  416. SD_inst->SDstate.Mode0Ptr->Energy.Stdev = (float)INITL_STDEV;
  417. }
  418. /* Set all frame counters = 0 */
  419. /* If SD initialization has failed, we are going to start over anyway */
  420. SD_inst->SDstate.initFrameCount=0;
  421. SD_inst->SDstate.Mode0Ptr->FrameCount=0;
  422. SD_inst->SDstate.Mode1Ptr->FrameCount=0;
  423. } /*end if TauEnergy.TauStdev > STOPPING_STDEV */
  424. return(SD_enable);
  425. } /* end initializeSD */
  426. /************************************************************************************************/
  427. /************************************************************************************************/
  428. /******* classify ************/
  429. /************************************************************************************************/
  430. /************************************************************************************************/
  431. /* Mark R. Walker
  432. Copyright Intel inc., 1995
  433. classify is called by Silence_Detect. */
  434. /************************************************************************************************/
  435. /************************************************************************************************/
  436. int classify(float Energy_val,float Alpha1_val,float Zc_count,
  437. float energy_mean,float energy_stdev,float alpha1_mean,
  438. float alpha1_stdev,float ZC_mean,float ZC_stdev,int s,
  439. float Energy_tx, float ZC_tx, INSTNCE *SD_inst)
  440. {
  441. float C1, C2, C3, C4, C5, C6, C7, C8, C9, C10, C11;
  442. int Class;
  443. /* If all decision criteria below do not apply,
  444. just set current frame type to previous frame type */
  445. Class = s;
  446. C1 = (float)fabs(Energy_val - energy_mean);
  447. C3 = (float)fabs(ZC_mean - Zc_count);
  448. C5 = (float)fabs(alpha1_mean - Alpha1_val);
  449. /* Note - Energy "on" threshold is unlike alpha and zero crossing */
  450. C2 = SD_inst->SDstate.SDsettings.Energy_on + energy_stdev;
  451. C10= Energy_tx + energy_stdev;
  452. C4 = SD_inst->SDstate.SDsettings.ZC_on * ZC_stdev;
  453. C11= ZC_tx * ZC_stdev;
  454. C6 = SD_inst->SDstate.SDsettings.Alpha1_on * alpha1_stdev;
  455. /* Note - Energy "off" threshold is unlike alpha and zero crossing */
  456. C7 = SD_inst->SDstate.SDsettings.Energy_off + energy_stdev;
  457. C8 = SD_inst->SDstate.SDsettings.ZC_off * ZC_stdev;
  458. C9 = SD_inst->SDstate.SDsettings.Alpha1_off * alpha1_stdev;
  459. if (s==SILENCE || s==NONADAPT) /* "Off" settings */
  460. {
  461. /* Energy criteria for coded-frame designation.
  462. * If energy indicator is above threshold, immediately
  463. * switch from silent mode to coded frame mode. Do no additional tests
  464. */
  465. if (C1 > C10)
  466. {
  467. Class = SPEECH;
  468. }
  469. /* Zero-crossing criteria for coded-frame designation.
  470. * If ZC indicator is high, allow switch to coded
  471. * frame mode only if alpha1 indicator is also high.
  472. */
  473. else
  474. if (C1 > C2)
  475. {
  476. Class = NONADAPT;
  477. }
  478. else
  479. if ((C3 > C11) && (C5 > C6))
  480. {
  481. Class = SPEECH;
  482. }
  483. else
  484. if ((C3 > C4) && (C5 > C6))
  485. {
  486. Class = NONADAPT;
  487. }
  488. }/* "On settings */
  489. /* Only allow transition from coded to silent frame mode only if
  490. * all three statistics are below threshold.
  491. */
  492. else
  493. if ((C5 < C9) && (C1 < C7) && (C3 < C8))
  494. {
  495. Class = SILENCE;
  496. }
  497. return(Class);
  498. } /*end classify*/
  499. /************************************************************************************************/
  500. /************************************************************************************************/
  501. /******* update ************/
  502. /************************************************************************************************/
  503. /************************************************************************************************/
  504. /* Mark R. Walker
  505. Copyright Intel inc., 1995*/
  506. /************************************************************************************************/
  507. /************************************************************************************************/
  508. void update(float *hist_array,int hist_size,float *mean,float *stdev)
  509. {
  510. /*subroutine update
  511. *Mark Walker
  512. *
  513. * inputs: hist_array, hist_size
  514. * outputs: mean, stdev
  515. */
  516. float sum, inv_size;
  517. int i;
  518. sum = 0.0f;
  519. inv_size = 1.0f / ((float)hist_size);
  520. for (i=0; i<hist_size; i++) sum += hist_array[i];
  521. *mean = sum * inv_size;
  522. sum = 0.0f;
  523. for (i=0; i<hist_size; i++) sum += (float)fabs(hist_array[i] - (*mean));
  524. *stdev = sum * inv_size;
  525. } /*end update*/
  526. //compute the zero crossing for an array of floats
  527. //the floats are treated as signed ints (32 bit)
  528. //the sign bits are extracted and adjacent ones xored
  529. //the xored values are accumulated in the result
  530. int zeroCross(float x[], int n)
  531. {
  532. int sgn0, sgn1;
  533. int zc = 0;
  534. int i = 0;
  535. sgn1 = ((int *)x)[0] >> 31; //initialize
  536. for (i = 0; i < n-1; i += 2)
  537. {
  538. sgn0 = ((int *)x)[i] >> 31;
  539. zc += sgn0 ^ sgn1;
  540. sgn1 = ((int *)x)[i+1] >> 31;
  541. zc += sgn0 ^ sgn1;
  542. }
  543. if (i == n-1) //odd case?
  544. {
  545. sgn0 = ((int *)x)[i] >> 31;
  546. zc += sgn0 ^ sgn1;
  547. }
  548. return -zc;
  549. }
  550. void prefilter(INSTNCE *SD_inst, float *sbuf, float *fbuf, int buffersize)
  551. {
  552. float *nBuffer, *dBuffer,*denom, *num;
  553. float x,recip;
  554. int i;
  555. nBuffer = SD_inst->SDstate.Filt.nBuffer;
  556. dBuffer = SD_inst->SDstate.Filt.dBuffer;
  557. denom = SD_inst->SDstate.Filt.denom;
  558. num = SD_inst->SDstate.Filt.num;
  559. recip = (float)(1.0/MAX_SAMPLE);
  560. for (i=0; i<buffersize; i++)
  561. {
  562. nBuffer[0] = nBuffer[1];
  563. nBuffer[1] = nBuffer[2];
  564. nBuffer[2] = nBuffer[3];
  565. nBuffer[3] = sbuf[i]*recip;
  566. x = nBuffer[0]*HhpNumer[3] +
  567. nBuffer[1]*HhpNumer[2] +
  568. nBuffer[2]*HhpNumer[1] +
  569. nBuffer[3]*HhpNumer[0] +
  570. dBuffer[0]*HhpDenom[2] +
  571. dBuffer[1]*HhpDenom[1] +
  572. dBuffer[2]*HhpDenom[0];
  573. dBuffer[0] = dBuffer[1];
  574. dBuffer[1] = dBuffer[2];
  575. dBuffer[2] = x;
  576. /* a low pass filter to cut off input speech frequency contents
  577. beyond 3.5 kHz */
  578. //Update FIR memory
  579. num[5] = num[4];
  580. num[4] = num[3];
  581. num[3] = num[2];
  582. num[2] = num[1];
  583. num[1] = num[0];
  584. num[0] = x;
  585. x = num[0]*B[0] +
  586. num[1]*B[1] +
  587. num[2]*B[2] +
  588. num[3]*B[3] +
  589. num[4]*B[4] +
  590. num[5]*B[5] +
  591. denom[0]*A[1] +
  592. denom[1]*A[2] +
  593. denom[2]*A[3] +
  594. denom[3]*A[4] +
  595. denom[4]*A[5];
  596. //Update IIR memory
  597. denom[4] = denom[3];
  598. denom[3] = denom[2];
  599. denom[2] = denom[1];
  600. denom[1] = denom[0];
  601. denom[0] = x;
  602. fbuf[i] = x;
  603. }
  604. return;
  605. }
  606. void execSDloop(INSTNCE *SD_inst, int *frameType, float sliderInput)
  607. {
  608. float squelch, e0mean, e0stdev, e_on;
  609. float Energy_tx, ZC_tx;
  610. int m1count, maxcount, hangtime;
  611. //Slider input
  612. if(sliderInput > SLIDER_MAX)
  613. sliderInput = SLIDER_MAX;
  614. else if(sliderInput < SLIDER_MIN)
  615. sliderInput = SLIDER_MIN;
  616. Energy_tx = INITL_ENERGY_ON + sliderInput;
  617. ZC_tx = INITL_ZC_ON + ZC_SLOPE * sliderInput;
  618. hangtime = INITL_HANGTIME + (int)(HANG_SLOPE * sliderInput);
  619. if ( ! SD_inst->SDstate.SD_enable) //run the initializer until SD_enable is set
  620. {
  621. SD_inst->SDstate.SD_enable = initializeSD(SD_inst);
  622. *frameType = SPEECH;
  623. SD_inst->SDstate.Class = SPEECH;
  624. }
  625. else if (SD_inst->SDstate.SD_enable )
  626. {
  627. *frameType = silenceDetect(SD_inst,Energy_tx,ZC_tx);
  628. if(*frameType == SILENCE)
  629. {
  630. if( (SD_inst->SDstate.Mode0Ptr->FrameCount==0)
  631. && (SD_inst->SDstate.Mode1Ptr->FrameCount>MIN_SPEECH_INTERVAL)
  632. && (SD_inst->SDstate.HangCntr != 0) )
  633. {
  634. SD_inst->SDstate.HangCntr--;
  635. *frameType = SPEECH; //force this frame to be coded
  636. }
  637. else if (SD_inst->SDstate.HangCntr == hangtime || SD_inst->SDstate.HangCntr == 0)
  638. {
  639. SD_inst->SDstate.Mode0Ptr->FrameCount++;
  640. SD_inst->SDstate.Mode1Ptr->FrameCount=0;
  641. SD_inst->SDstate.HangCntr = hangtime;
  642. }
  643. }
  644. else
  645. {
  646. if(SD_inst->SDstate.HangCntr != hangtime)
  647. SD_inst->SDstate.Mode1Ptr->FrameCount=0;
  648. SD_inst->SDstate.Mode1Ptr->FrameCount++;
  649. SD_inst->SDstate.Mode0Ptr->FrameCount=0;
  650. SD_inst->SDstate.HangCntr = hangtime;
  651. }
  652. /*
  653. If the adaptive threshold for switching from silence to coded frame ("Off")
  654. has risen above the squelch level, re-initialization will occur on the next frame.
  655. Re-initialization will also occur when the Mode1FrameCount (continuous non-silent frame count)
  656. exceeds 4 seconds.
  657. */
  658. squelch = SD_inst->SDstate.SDsettings.Squelch_set;
  659. e0mean = SD_inst->SDstate.Mode0Ptr->Energy.Mean;
  660. e0stdev = SD_inst->SDstate.Mode0Ptr->Energy.Stdev;
  661. e_on = SD_inst->SDstate.SDsettings.Energy_on;
  662. m1count = SD_inst->SDstate.Mode1Ptr->FrameCount;
  663. maxcount= SD_inst->SDstate.SDsettings.MaxSpeechFrameCount;
  664. if ((fabs(e0mean - squelch) < (e_on + e0stdev)) || (m1count >= maxcount))
  665. { /* reinitialization will occur on next frame - reset global values now */
  666. SD_inst->SDstate.SD_enable = FALSE;
  667. SD_inst->SDstate.Mode0Ptr->FrameCount=0;
  668. SD_inst->SDstate.Mode1Ptr->FrameCount=0;
  669. SD_inst->SDstate.Mode0Ptr->Energy.Mean = squelch;
  670. SD_inst->SDstate.Mode0Ptr->Energy.Stdev = (float) INITL_STDEV;
  671. SD_inst->SDstate.HangCntr = hangtime;
  672. *frameType = SPEECH;
  673. }
  674. }//end if SD_enable
  675. return;
  676. }
  677. float DotProdSD(float *in1, float *in2, int len)
  678. {
  679. int i;
  680. float sum;
  681. sum = (float)0.0;
  682. for (i=0; i<len; i++)
  683. sum += in1[i]*in2[i];
  684. return(sum);
  685. }
  686. __inline unsigned randBit()
  687. {
  688. volatile static unsigned seed = 1;
  689. unsigned bit, temp;
  690. temp = seed;
  691. bit = 1 & ((temp) ^ (temp >> 2) ^ (temp >> 31));
  692. seed = (temp << 1) | bit;
  693. return( bit );
  694. }
  695. extern __inline unsigned short getRand()
  696. {
  697. return (short)(randBit() + (randBit()<<1));
  698. }