Towards Efficient and Multifaceted Computer-assisted Pronunciation Training Leveraging Hierarchical Selective State Space Model and Decoupled Cross-entropy Loss
Fu-An Chao and Berlin Chen
In the Annual Conference of the Nations of the Americas Chapter of the Association for Computational Linguistics (NAACL), 2025
% NAACL 2025 conference paper on computer-assisted pronunciation training
% (hierarchical selective state space model, decoupled cross-entropy loss).
% booktitle names the conference itself rather than only the ACL chapter.
@inproceedings{chao2025efficientmultifacetedcomputerassistedpronunciation,
  author    = {Chao, Fu-An and Chen, Berlin},
  title     = {Towards Efficient and Multifaceted Computer-assisted Pronunciation Training Leveraging Hierarchical Selective State Space Model and Decoupled Cross-entropy Loss},
  booktitle = {the Annual Conference of the Nations of the Americas Chapter of the Association for Computational Linguistics (NAACL)},
  year      = {2025},
}
% Findings of NAACL 2024 paper on automated speaking assessment under
% data scarcity and imbalanced score distribution.
% booktitle uses the Findings volume title that the DOI below belongs to.
@inproceedings{lo2024effective,
  author    = {Lo, Tien-Hong and Chao, Fu-An and Wu, Tzu-I and Sung, Yao-Ting and Chen, Berlin},
  title     = {An Effective Automated Speaking Assessment Approach to Mitigating Data Scarcity and Imbalanced Distribution},
  booktitle = {Findings of the Association for Computational Linguistics: NAACL 2024},
  year      = {2024},
  pages     = {1352--1362},
  doi       = {10.18653/v1/2024.findings-naacl.86},
}
% Interspeech 2023 paper on hierarchical, context-aware pronunciation assessment.
% The title is singly braced so that the bibliography style controls its casing.
@inproceedings{chao23hierarchical,
  author    = {Chao, Fu-An and Lo, Tien-Hong and Wu, Tzu-I and Sung, Yao-Ting and Chen, Berlin},
  title     = {A Hierarchical Context-aware Modeling Approach for Multi-aspect and Multi-granular Pronunciation Assessment},
  booktitle = {the 24th Annual Conference of the International Speech Communication Association (Interspeech)},
  year      = {2023},
  pages     = {974--978},
  doi       = {10.21437/Interspeech.2023-550},
}
% APSIPA ASC 2022 paper introducing the 3M pronunciation-assessment model.
% The title is stored in Title Case; {3M} and {English} are brace-protected so
% sentence-casing styles cannot lowercase them.
@inproceedings{chao20223m,
  author       = {Chao, Fu-An and Lo, Tien-Hong and Wu, Tzu-I and Sung, Yao-Ting and Chen, Berlin},
  title        = {{3M}: An Effective Multi-view, Multi-granularity, and Multi-aspect Modeling Approach to {English} Pronunciation Assessment},
  booktitle    = {Asia-Pacific Signal and Information Processing Association Annual Summit and Conference (APSIPA ASC)},
  organization = {IEEE},
  year         = {2022},
  pages        = {575--582},
  doi          = {10.23919/APSIPAASC55919.2022.9979979},
}
% Journal article (IEEE MultiMedia) on a time-reversal enhancement network
% with cross-domain information for noise-robust speech recognition.
% NOTE(review): volume 29, number 1 may belong to the 2022 issue year while
% year is recorded as 2021 -- confirm against the publisher record.
@article{chao2021time,
  author    = {Chao, Fu-An and Hung, Jeih-Weih and Sheu, Tommy and Chen, Berlin},
  title     = {Time-Reversal Enhancement Network With Cross-Domain Information for Noise-Robust Speech Recognition},
  journal   = {IEEE MultiMedia},
  volume    = {29},
  number    = {1},
  pages     = {114--124},
  year      = {2021},
  publisher = {IEEE},
  doi       = {10.1109/MMUL.2021.3139302},
}
% ASRU 2021 paper introducing TENET, a time-reversal enhancement network.
% The acronyms {TENET} and {ASR} are brace-protected against sentence-casing styles.
% NOTE(review): the second author's surname is taken to be the compound
% "Fan Jiang" (given name "Shao-Wei"); confirm against the published paper.
@inproceedings{chao2021tenet,
  author       = {Chao, Fu-An and Fan Jiang, Shao-Wei and Yan, Bi-Cheng and Hung, Jeih-weih and Chen, Berlin},
  title        = {{TENET}: A Time-Reversal Enhancement Network for Noise-Robust {ASR}},
  booktitle    = {IEEE Automatic Speech Recognition and Understanding Workshop (ASRU)},
  organization = {IEEE},
  year         = {2021},
  pages        = {55--61},
  doi          = {10.1109/ASRU51503.2021.9687924},
}
% ICME 2021 paper on cross-domain single-channel speech enhancement with a
% bi-projection fusion module.
% booktitle is capitalised explicitly because styles do not recase it;
% {ASR} is brace-protected against sentence-casing styles.
@inproceedings{chao2021cross,
  author       = {Chao, Fu-An and Hung, Jeih-weih and Chen, Berlin},
  title        = {Cross-Domain Single-Channel Speech Enhancement Model with Bi-Projection Fusion Module for Noise-Robust {ASR}},
  booktitle    = {IEEE International Conference on Multimedia and Expo (ICME)},
  organization = {IEEE},
  year         = {2021},
  pages        = {1--6},
  doi          = {10.1109/ICME51207.2021.9428157},
}