<?xml version="1.0" encoding="UTF-8"?>
<doi_batch version="4.3.0" xmlns="http://www.crossref.org/doi_resources_schema/4.3.0" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xsi:schemaLocation="http://www.crossref.org/doi_resources_schema/4.3.0 http://www.crossref.org/schema/deposit/doi_resources4.3.0.xsd">
<head>
  <!-- Deposit header: batch identifier plus the depositor's name and contact e-mail. -->
  <doi_batch_id>b7322d75-8a3e-40c5-8964-4211ca337366</doi_batch_id>
  <depositor>
    <name>beie</name>
    <email_address>director@blueeyesintelligence.org</email_address>
  </depositor>
</head>
<body>
<doi_citations>
  <!--
    Reference list deposited for the DOI below.
    One citation per reference; keys are zero-based and contiguous (ref0 to ref24).
    Whitespace is added only between elements: the text inside each
    unstructured_citation is kept on a single line because line breaks there
    would become part of the deposited citation string.
  -->
  <doi>10.35940/ijitee.D1051.14040325</doi>
  <citation_list>
    <citation key="ref0">
      <doi>10.7176/CEIS/13-3-03</doi>
      <unstructured_citation>S. Alimi and A. Oludele, &quot;Voice Activity Detection: Fusion of Time and Frequency Domain Features with A SVM Classifier,&quot; Comput. Eng. Intell. Syst., vol. 13, no. 3, pp. 20-29, 2022, DOI: https://doi.org/10.7176/CEIS/13-3-03</unstructured_citation>
    </citation>
    <citation key="ref1">
      <doi>10.3390/electronics12040795</doi>
      <unstructured_citation>M. Faghani, H. Rezaee-Dehsorkh, N. Ravanshad, and H. Aminzadeh, &quot;Ultra-Low-Power Voice Activity Detection System Using Level-Crossing Sampling,&quot; Electron., vol. 12, no. 4, 2023, DOI: https://doi.org/10.3390/electronics12040795</unstructured_citation>
    </citation>
    <citation key="ref2">
      <doi>10.1109/GlobalSIP45357.2019.8969258</doi>
      <unstructured_citation>H. Krishnakumar and D. S. Williamson, &quot;A comparison of boosted deep neural networks for voice activity detection,&quot; in GlobalSIP 2019 - 7th IEEE Global Conference on Signal and Information Processing, Proceedings, 2019. DOI: https://doi.org/10.1109/GlobalSIP45357.2019.8969258</unstructured_citation>
    </citation>
    <citation key="ref3">
      <doi>10.1017/S0033291721002804</doi>
      <unstructured_citation>J. N. de Boer et al., &quot;Acoustic speech markers for schizophrenia-spectrum disorders: A diagnostic and symptom-recognition tool,&quot; Psychol. Med., 2021, DOI: https://doi.org/10.1017/S0033291721002804</unstructured_citation>
    </citation>
    <citation key="ref4">
      <doi>10.1016/j.medengphy.2010.07.013</doi>
      <unstructured_citation>V. Rapcan, S. D'Arcy, S. Yeap, N. Afzal, J. Thakore, and R. B. Reilly, &quot;Acoustic and temporal analysis of speech: A potential biomarker for schizophrenia,&quot; Med. Eng. Phys., vol. 32, no. 9, pp. 1074-1079, Nov. 2010, DOI: https://doi.org/10.1016/j.medengphy.2010.07.013</unstructured_citation>
    </citation>
    <citation key="ref5">
      <doi>10.1016/j.apacoust.2020.107344</doi>
      <unstructured_citation>R. Makowski and R. Hossa, &quot;Voice activity detection with quasi-quadrature filters and GMM decomposition for speech and noise,&quot; Appl. Acoust., vol. 166, 2020, DOI: https://doi.org/10.1016/j.apacoust.2020.107344</unstructured_citation>
    </citation>
    <citation key="ref6">
      <doi>10.1186/s13636-018-0135-7</doi>
      <unstructured_citation>S. Dwijayanti, K. Yamamori, and M. Miyoshi, &quot;Enhancement of speech dynamics for voice activity detection using DNN,&quot; Eurasip J. Audio, Speech, Music Process., vol. 2018, no. 1, 2018, DOI: https://doi.org/10.1186/s13636-018-0135-7</unstructured_citation>
    </citation>
    <citation key="ref7">
      <doi>10.21437/Interspeech.2020-2285</doi>
      <unstructured_citation>M. Lavechin, M. P. Gill, R. Bousbib, H. Bredin, and L. P. Garcia-Perera, &quot;End-to-end domain-adversarial voice activity detection,&quot; in Proceedings of the Annual Conference of the International Speech Communication Association, INTERSPEECH, 2020. DOI: https://doi.org/10.21437/Interspeech.2020-2285</unstructured_citation>
    </citation>
    <citation key="ref8">
      <doi>10.1186/s13636-016-0092-y</doi>
      <unstructured_citation>X.-K. Yang, L. He, D. Qu, and W.-Q. Zhang, &quot;Voice activity detection algorithm based on long-term pitch information,&quot; 2016, DOI: https://doi.org/10.1186/s13636-016-0092-y</unstructured_citation>
    </citation>
    <citation key="ref9">
      <doi>10.1109/SIVA.2018.8661045</doi>
      <unstructured_citation>C. E. Chelloug and A. Farrouki, &quot;Robust Voice Activity Detection Against Non Homogeneous Noisy Environments,&quot; in 2018 International Conference on Signal, Image, Vision and their Applications, SIVA 2018, 2019. DOI: https://doi.org/10.1109/SIVA.2018.8661045</unstructured_citation>
    </citation>
    <citation key="ref10">
      <doi>10.1016/j.csl.2019.06.005</doi>
      <unstructured_citation>Z. H. Tan, A. kr Sarkar, and N. Dehak, &quot;rVAD: An unsupervised segment-based robust voice activity detection method,&quot; Comput. Speech Lang., vol. 59, 2020, DOI: https://doi.org/10.1016/j.csl.2019.06.005</unstructured_citation>
    </citation>
    <citation key="ref11">
      <doi>10.1109/CCWC.2017.7868454</doi>
      <unstructured_citation>J. Pang, &quot;Spectrum energy based voice activity detection,&quot; in 2017 IEEE 7th Annual Computing and Communication Workshop and Conference, CCWC 2017, 2017. DOI: https://doi.org/10.1109/CCWC.2017.7868454</unstructured_citation>
    </citation>
    <citation key="ref12">
      <doi>10.1109/ACCESS.2018.2805845</doi>
      <unstructured_citation>Z. Ali and M. Talha, Innovative Method for Unsupervised Voice Activity Detection and Classification of Audio Segments, vol. 6. 2018. DOI: https://doi.org/10.1109/ACCESS.2018.2805845</unstructured_citation>
    </citation>
    <citation key="ref13">
      <doi>10.1088/1742-6596/705/1/012037</doi>
      <unstructured_citation>P. D. Ortiz, L. F. Villa, C. Salazar, and O. L. Quintero, &quot;A simple but efficient voice activity detection algorithm through Hilbert transform and dynamic threshold for speech pathologies,&quot; J. Phys. Conf. Ser., vol. 705, no. 1, 2016, DOI: https://doi.org/10.1088/1742-6596/705/1/012037</unstructured_citation>
    </citation>
    <citation key="ref14">
      <doi>10.3390/e18080298</doi>
      <unstructured_citation>R. J. Elton, P. Vasuki, and J. Mohanalin, &quot;Voice activity detection using fuzzy entropy and support vector machine,&quot; Entropy, vol. 18, no. 8, 2016, DOI: https://doi.org/10.3390/e18080298</unstructured_citation>
    </citation>
    <citation key="ref15">
      <doi>10.21437/Interspeech.2016-268</doi>
      <unstructured_citation>R. Zazo, T. N. Sainath, G. Simko, and C. Parada, &quot;Feature learning with raw-waveform CLDNNs for Voice Activity Detection,&quot; in Proceedings of the Annual Conference of the International Speech Communication Association, INTERSPEECH, 2016. DOI: https://doi.org/10.21437/Interspeech.2016-268</unstructured_citation>
    </citation>
    <!-- Single reference: its title and DOI belong together in one citation entry. -->
    <citation key="ref16">
      <doi>10.1109/ACCESS.2018.2800728</doi>
      <unstructured_citation>A. Sehgal and N. Kehtarnavaz, &quot;A Convolutional Neural Network Smartphone App for Real-Time Voice Activity Detection,&quot; IEEE Access, vol. 6, 2018, DOI: https://doi.org/10.1109/ACCESS.2018.2800728</unstructured_citation>
    </citation>
    <citation key="ref17">
      <doi>10.1109/ICECE.2018.8636745</doi>
      <unstructured_citation>J. Dey, M. S. Bin Hossain, and M. A. Haque, &quot;An ensemble SVM-based approach for voice activity detection,&quot; in ICECE 2018 - 10th International Conference on Electrical and Computer Engineering, 2019. DOI: https://doi.org/10.1109/ICECE.2018.8636745</unstructured_citation>
    </citation>
    <citation key="ref18">
      <doi>10.1109/LSP.2015.2495219</doi>
      <unstructured_citation>T. Drugman, Y. Stylianou, Y. Kida, and M. Akamine, &quot;Voice Activity Detection: Merging Source and Filter-based Information,&quot; IEEE Signal Process. Lett., vol. 23, no. 2, 2016, DOI: https://doi.org/10.1109/LSP.2015.2495219</unstructured_citation>
    </citation>
    <citation key="ref19">
      <doi>10.1515/9783110873429</doi>
      <unstructured_citation>G. Fant, Acoustic Theory of Speech Production: With Calculations based on X-Ray Studies of Russian Articulations. Berlin: Gruyter Mouton, 1971. [Online]. Available: DOI: https://doi.org/10.1515/9783110873429</unstructured_citation>
    </citation>
    <citation key="ref20">
      <doi>10.1007/978-3-642-38013-6_2</doi>
      <unstructured_citation>H. Uhrmann, R. Kolm, and H. Zimmermann, &quot;Analog Filters,&quot; Springer Ser. Adv. Microelectron., vol. 45, pp. 3-11, 2014, DOI: https://doi.org/10.1007/978-3-642-38013-6_2</unstructured_citation>
    </citation>
    <citation key="ref21">
      <doi>10.1155/2007/96384</doi>
      <unstructured_citation>P. Händel, &quot;Power spectral density error analysis of spectral subtraction type of speech enhancement methods,&quot; EURASIP J. Adv. Signal Process., vol. 2007, 2007, DOI: https://doi.org/10.1155/2007/96384</unstructured_citation>
    </citation>
    <citation key="ref22">
      <doi>10.35940/ijeat.A1083.1291S319</doi>
      <unstructured_citation>Das, P., Pathak, R., &amp; Beulet. P, A. S. (2019). Low Power Implementation Of Ternary Content Addressable Memory (TCAM). In International Journal of Engineering and Advanced Technology (Vol. 9, Issue 1s3, pp. 455-460). DOI: https://doi.org/10.35940/ijeat.A1083.1291S319</unstructured_citation>
    </citation>
    <citation key="ref23">
      <doi>10.35940/ijitee.A4998.119119</doi>
      <unstructured_citation>Sharma, Dr. A., &amp; Sohal, Dr. H. (2019). Sleepy- Gate Diffusion Input (S-GDI)-Ultra Low Power Technique for Digital Design. In International Journal of Innovative Technology and Exploring Engineering (Vol. 9, Issue 1, pp. 4340-4347). DOI: https://doi.org/10.35940/ijitee.A4998.119119</unstructured_citation>
    </citation>
    <citation key="ref24">
      <doi>10.35940/ijrte.D4368.118419</doi>
      <unstructured_citation>Chandra, K. S., Kishore, K. H., Giri, P., &amp; Reddy, E. S. (2019). Design of 8T CNTFET SRAM for Ultra-Low Power Microelectronic Applications. In International Journal of Recent Technology and Engineering (IJRTE) (Vol. 8, Issue 4, pp. 10148-10152). DOI: https://doi.org/10.35940/ijrte.D4368.118419</unstructured_citation>
    </citation>
  </citation_list>
</doi_citations>
</body>
</doi_batch>
