@article{ author = {Mohadese EshaghiandFarbod RazzaziandAlireza Behrad}, title = {A New VAD Algorithm using Sparse Representation in Spectro-Temporal Domain}, journal = {Journal of Information Systems and Telecommunication (JIST) }, volume = {7}, number = {1}, page = {74-87}, year = {2019}, publisher = {Iranian Academic Center for Education,Culture and Research }, issn = {2322-1437}, eissn = {2345-2773}, doi = {10.7508/jist.2019.01.007}, abstract = {This paper proposes two algorithms for Voice Activity Detection (VAD) based on sparse representation in spectro-temporal domain. The first algorithm was made using two-dimensional STRF (Spectro-Temporal Response Field) space based on sparse representation. Dictionaries with different atomic sizes and two dictionary learning methods were investigated in this approach. This algorithm revealed good results at high SNRs (signal-to-noise ratio). The second algorithm, whose approach is more complicated, suggests a speech detector using the sparse representation in four-dimensional STRF space. Due to the large volume of STRF's four-dimensional space, this space was divided into cubes, with dictionaries made for each cube separately by NMF (non-negative matrix factorization) learning algorithm. Simulation results were presented to illustrate the effectiveness of our new VAD algorithms. The results revealed that the achieved performance was 90.11% and 91.75% under -5 dB SNR in white and car noise respectively, outperforming most of the state-of-the-art VAD algorithms.}, keywords = {Speech Processing,Voice Activity Detector (VAD),Spectro-Temporal Domain Representation,Sparse Representation,NMF,K-SVD}, title_fa = {A New VAD Algorithm using Sparse Representation in Spectro-Temporal Domain}, abstract_fa = {This paper proposes two algorithms for Voice Activity Detection (VAD) based on sparse representation in spectro-temporal domain. The first algorithm was made using two-dimensional STRF (Spectro-Temporal Response Field) space based on sparse representation. Dictionaries with different atomic sizes and two dictionary learning methods were investigated in this approach. This algorithm revealed good results at high SNRs (signal-to-noise ratio). The second algorithm, whose approach is more complicated, suggests a speech detector using the sparse representation in four-dimensional STRF space. Due to the large volume of STRF's four-dimensional space, this space was divided into cubes, with dictionaries made for each cube separately by NMF (non-negative matrix factorization) learning algorithm. Simulation results were presented to illustrate the effectiveness of our new VAD algorithms. The results revealed that the achieved performance was 90.11% and 91.75% under -5 dB SNR in white and car noise respectively, outperforming most of the state-of-the-art VAD algorithms.}, keywords_fa = {Speech Processing ,Voice Activity Detector (VAD) ,Spectro-Temporal Domain Representation ,Sparse Representation ,NMF ,K-SVD}, URL = {rimag.ir/fa/Article/15253}, eprint = {rimag.ir/fa/Article/Download/15253},