Pub Date : 2023-12-28DOI: 10.1007/s10772-023-10079-0
Souha Ayadi, Z. Lachiri
{"title":"Deep neural network architectures for audio emotion recognition performed on song and speech modalities","authors":"Souha Ayadi, Z. Lachiri","doi":"10.1007/s10772-023-10079-0","DOIUrl":"https://doi.org/10.1007/s10772-023-10079-0","url":null,"abstract":"","PeriodicalId":14305,"journal":{"name":"International Journal of Speech Technology","volume":"197 3","pages":""},"PeriodicalIF":0.0,"publicationDate":"2023-12-28","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"139152878","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":0,"RegionCategory":"","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
Pub Date : 2023-12-23DOI: 10.1007/s10772-023-10075-4
Noor D. Al-Shakarchy, Huda Rageb, Mais Saad Safoq
{"title":"Gender and age-evolution detection based on audio forensic analysis using light deep neural network","authors":"Noor D. Al-Shakarchy, Huda Rageb, Mais Saad Safoq","doi":"10.1007/s10772-023-10075-4","DOIUrl":"https://doi.org/10.1007/s10772-023-10075-4","url":null,"abstract":"","PeriodicalId":14305,"journal":{"name":"International Journal of Speech Technology","volume":"7 10","pages":""},"PeriodicalIF":0.0,"publicationDate":"2023-12-23","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"139161461","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":0,"RegionCategory":"","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
Pub Date : 2023-12-22DOI: 10.1007/s10772-023-10074-5
Khamis A. AL-KARAWI
{"title":"Real-time adaptive training for forensic speaker verification in reverberation conditions","authors":"Khamis A. AL-KARAWI","doi":"10.1007/s10772-023-10074-5","DOIUrl":"https://doi.org/10.1007/s10772-023-10074-5","url":null,"abstract":"","PeriodicalId":14305,"journal":{"name":"International Journal of Speech Technology","volume":"3 4","pages":""},"PeriodicalIF":0.0,"publicationDate":"2023-12-22","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"138946111","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":0,"RegionCategory":"","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
Pub Date : 2023-12-21DOI: 10.1007/s10772-023-10072-7
Gebremichael Kibret Sheferaw, W. Mwangi, Michael Kimwele, A. Mamuye
{"title":"Waveform based speech coding using nonlinear predictive techniques: a systematic review","authors":"Gebremichael Kibret Sheferaw, W. Mwangi, Michael Kimwele, A. Mamuye","doi":"10.1007/s10772-023-10072-7","DOIUrl":"https://doi.org/10.1007/s10772-023-10072-7","url":null,"abstract":"","PeriodicalId":14305,"journal":{"name":"International Journal of Speech Technology","volume":"49 15","pages":""},"PeriodicalIF":0.0,"publicationDate":"2023-12-21","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"138952581","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":0,"RegionCategory":"","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
Pub Date : 2023-12-19DOI: 10.1007/s10772-023-10076-3
K. Nataraj, Prem C. Pandey, H. Dasgupta
{"title":"Estimation of place of articulation of fricatives from spectral features","authors":"K. Nataraj, Prem C. Pandey, H. Dasgupta","doi":"10.1007/s10772-023-10076-3","DOIUrl":"https://doi.org/10.1007/s10772-023-10076-3","url":null,"abstract":"","PeriodicalId":14305,"journal":{"name":"International Journal of Speech Technology","volume":" 27","pages":""},"PeriodicalIF":0.0,"publicationDate":"2023-12-19","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"138962215","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":0,"RegionCategory":"","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
Pub Date : 2023-12-13DOI: 10.1007/s10772-023-10071-8
R. Rajan, T. V. Hridya Raj
{"title":"SENet-based speech emotion recognition using synthesis-style transfer data augmentation","authors":"R. Rajan, T. V. Hridya Raj","doi":"10.1007/s10772-023-10071-8","DOIUrl":"https://doi.org/10.1007/s10772-023-10071-8","url":null,"abstract":"","PeriodicalId":14305,"journal":{"name":"International Journal of Speech Technology","volume":"34 1","pages":""},"PeriodicalIF":0.0,"publicationDate":"2023-12-13","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"139006615","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":0,"RegionCategory":"","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
Pub Date : 2023-11-29DOI: 10.1007/s10772-023-10070-9
Chiron Bang, Nicholas Bogdanovic, Gali Deutsch, Oge Marques
{"title":"Machine learning for the diagnosis of Parkinson’s disease using speech analysis: a systematic review","authors":"Chiron Bang, Nicholas Bogdanovic, Gali Deutsch, Oge Marques","doi":"10.1007/s10772-023-10070-9","DOIUrl":"https://doi.org/10.1007/s10772-023-10070-9","url":null,"abstract":"","PeriodicalId":14305,"journal":{"name":"International Journal of Speech Technology","volume":"50 1","pages":""},"PeriodicalIF":0.0,"publicationDate":"2023-11-29","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"139210302","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":0,"RegionCategory":"","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
Pub Date : 2023-11-22DOI: 10.1007/s10772-023-10068-3
Sudhansu Sekhar Nayak, A. D. Darji, Prashant K. Shah
{"title":"Identification of Parkinson’s disease from speech signal using machine learning approach","authors":"Sudhansu Sekhar Nayak, A. D. Darji, Prashant K. Shah","doi":"10.1007/s10772-023-10068-3","DOIUrl":"https://doi.org/10.1007/s10772-023-10068-3","url":null,"abstract":"","PeriodicalId":14305,"journal":{"name":"International Journal of Speech Technology","volume":"37 3","pages":""},"PeriodicalIF":0.0,"publicationDate":"2023-11-22","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"139246917","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":0,"RegionCategory":"","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
Pub Date : 2023-11-20DOI: 10.1007/s10772-023-10069-2
Aluru V. N. M. Hemateja, Gopikrishnan Kondakath, Susruta Das, Mohanaprasad Kothandaraman, S. Shoba, Abhishek Pandey, Rajin Babu, Abhinav Jain
{"title":"Correction to: Novel data augmentation for named entity recognition","authors":"Aluru V. N. M. Hemateja, Gopikrishnan Kondakath, Susruta Das, Mohanaprasad Kothandaraman, S. Shoba, Abhishek Pandey, Rajin Babu, Abhinav Jain","doi":"10.1007/s10772-023-10069-2","DOIUrl":"https://doi.org/10.1007/s10772-023-10069-2","url":null,"abstract":"","PeriodicalId":14305,"journal":{"name":"International Journal of Speech Technology","volume":"43 6","pages":""},"PeriodicalIF":0.0,"publicationDate":"2023-11-20","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"139258395","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":0,"RegionCategory":"","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}