Pub Date : 2024-04-14DOI: 10.1109/icassp48485.2024.10445852
Rui Zhang, Xiaoran Yan
{"title":"Video-Language Graph Convolutional Network for Human Action Recognition","authors":"Rui Zhang, Xiaoran Yan","doi":"10.1109/icassp48485.2024.10445852","DOIUrl":"https://doi.org/10.1109/icassp48485.2024.10445852","url":null,"abstract":"","PeriodicalId":517764,"journal":{"name":"ICASSP 2024 - 2024 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","volume":"53 3","pages":""},"PeriodicalIF":0.0,"publicationDate":"2024-04-14","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"140705918","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":0,"RegionCategory":"","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
Pub Date : 2024-04-14DOI: 10.1109/icassp48485.2024.10446296
Hui Lu, Xixin Wu, Haohan Guo, Songxiang Liu, Zhiyong Wu, Helen M. Meng
{"title":"Unifying One-Shot Voice Conversion and Cloning with Disentangled Speech Representations","authors":"Hui Lu, Xixin Wu, Haohan Guo, Songxiang Liu, Zhiyong Wu, Helen M. Meng","doi":"10.1109/icassp48485.2024.10446296","DOIUrl":"https://doi.org/10.1109/icassp48485.2024.10446296","url":null,"abstract":"","PeriodicalId":517764,"journal":{"name":"ICASSP 2024 - 2024 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","volume":"221 8","pages":""},"PeriodicalIF":0.0,"publicationDate":"2024-04-14","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"140704250","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":0,"RegionCategory":"","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
Pub Date : 2024-04-14DOI: 10.1109/icassp48485.2024.10448157
Mahmoud Namazi, Kenneth Rose
{"title":"Ultra-Low Delay Lossless Compression of Higher Order Ambisonics","authors":"Mahmoud Namazi, Kenneth Rose","doi":"10.1109/icassp48485.2024.10448157","DOIUrl":"https://doi.org/10.1109/icassp48485.2024.10448157","url":null,"abstract":"","PeriodicalId":517764,"journal":{"name":"ICASSP 2024 - 2024 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","volume":"145 2","pages":""},"PeriodicalIF":0.0,"publicationDate":"2024-04-14","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"140704310","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":0,"RegionCategory":"","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
Pub Date : 2024-04-14DOI: 10.1109/icassp48485.2024.10446967
Lang Liu, Zaïd Harchaoui
{"title":"The Rao, Wald, And Likelihood-Ratio Tests under Generalized Self-Concordance","authors":"Lang Liu, Zaïd Harchaoui","doi":"10.1109/icassp48485.2024.10446967","DOIUrl":"https://doi.org/10.1109/icassp48485.2024.10446967","url":null,"abstract":"","PeriodicalId":517764,"journal":{"name":"ICASSP 2024 - 2024 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","volume":"214 2","pages":""},"PeriodicalIF":0.0,"publicationDate":"2024-04-14","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"140704398","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":0,"RegionCategory":"","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
Pub Date : 2024-04-14DOI: 10.1109/icassp48485.2024.10446821
Patitapaban Palo, A. Routray, Ritesh Chandra Tewari
{"title":"A Graph Neural Network Based Approach for Fault Delineation in Seismic Data using Graph Total Variation and Multigraph","authors":"Patitapaban Palo, A. Routray, Ritesh Chandra Tewari","doi":"10.1109/icassp48485.2024.10446821","DOIUrl":"https://doi.org/10.1109/icassp48485.2024.10446821","url":null,"abstract":"","PeriodicalId":517764,"journal":{"name":"ICASSP 2024 - 2024 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","volume":"33 2","pages":""},"PeriodicalIF":0.0,"publicationDate":"2024-04-14","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"140705603","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":0,"RegionCategory":"","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
Pub Date : 2024-04-14DOI: 10.1109/icassp48485.2024.10447201
Pavlo Hilei, Marian Petruk, Ievgen V. Korotkyi, Oleg Farenyuk
{"title":"Deep Learning AMR Model Inference Acceleration with CFU for Edge Systems","authors":"Pavlo Hilei, Marian Petruk, Ievgen V. Korotkyi, Oleg Farenyuk","doi":"10.1109/icassp48485.2024.10447201","DOIUrl":"https://doi.org/10.1109/icassp48485.2024.10447201","url":null,"abstract":"","PeriodicalId":517764,"journal":{"name":"ICASSP 2024 - 2024 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","volume":"2 10","pages":""},"PeriodicalIF":0.0,"publicationDate":"2024-04-14","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"140705849","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":0,"RegionCategory":"","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
Pub Date : 2024-04-14DOI: 10.1109/icassp48485.2024.10446808
Feng Ding, Xiu Liu, Xinyi Wang, Fangming Zhong
{"title":"Dual-Mix for Cross-Modal Retrieval with Noisy Labels","authors":"Feng Ding, Xiu Liu, Xinyi Wang, Fangming Zhong","doi":"10.1109/icassp48485.2024.10446808","DOIUrl":"https://doi.org/10.1109/icassp48485.2024.10446808","url":null,"abstract":"","PeriodicalId":517764,"journal":{"name":"ICASSP 2024 - 2024 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","volume":"184 5","pages":""},"PeriodicalIF":0.0,"publicationDate":"2024-04-14","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"140706578","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":0,"RegionCategory":"","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}