@inproceedings{chien2024learning,
  author        = {Chien, Chung-Ming and Tjandra, Andros and Vyas, Apoorv and Le, Matt and Shi, Bowen and Hsu, Wei-Ning},
  title         = {Learning Fine-Grained Controllability on Speech Generation via Efficient Fine-Tuning},
  booktitle     = {Interspeech 2024},
  year          = {2024},
  month         = sep,
  eprint        = {2406.06251},
  archiveprefix = {arXiv},
  primaryclass  = {eess.AS},
}
% booktitle uses the "Findings of the Association for Computational Linguistics: VENUE YEAR" form (colon before the venue).
@inproceedings{arora2024on,
  author        = {Arora, Siddhant and Pasad, Ankita and Chien, Chung-Ming and Han, Jionghao and Sharma, Roshan and Jung, Jee-weon and Dhamyal, Hira and Chen, William and Shon, Suwon and Lee, Hung-yi and Livescu, Karen and Watanabe, Shinji},
  title         = {On the Evaluation of Speech Foundation Models for Spoken Language Understanding},
  booktitle     = {Findings of the Association for Computational Linguistics: ACL 2024},
  year          = {2024},
  month         = aug,
  eprint        = {2406.10083},
  archiveprefix = {arXiv},
  primaryclass  = {cs.CL},
}
% The model name in the title is brace-protected so sentence-casing styles keep its capitalisation.
@inproceedings{chou2023av2wav,
  author        = {Chou, Ju-Chieh and Chien, Chung-Ming and Livescu, Karen},
  title         = {{AV2Wav}: Diffusion-Based Re-synthesis from Continuous Self-supervised Features for Audio-Visual Speech Enhancement},
  booktitle     = {ICASSP 2024 - 2024 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)},
  year          = {2024},
  month         = apr,
  eprint        = {2309.08030},
  archiveprefix = {arXiv},
  primaryclass  = {eess.AS},
}
% NOTE(review): the key says 2023 (presumably the arXiv preprint year) while the journal fields give volume 12, 2024; key kept so existing citations still resolve.
@article{pasad2023what,
  author        = {Pasad, Ankita and Chien, Chung-Ming and Settle, Shane and Livescu, Karen},
  title         = {What Do Self-Supervised Speech Models Know about Words?},
  journal       = {Transactions of the Association for Computational Linguistics},
  volume        = {12},
  pages         = {372--391},
  year          = {2024},
  month         = apr,
  issn          = {2307-387X},
  doi           = {10.1162/tacl_a_00656},
  eprint        = {2307.00162},
  archiveprefix = {arXiv},
  primaryclass  = {cs.CL},
}
@inproceedings{chien2023few,
  author        = {Chien, Chung-Ming and Zhang, Mingjiamei and Chou, Ju-Chieh and Livescu, Karen},
  title         = {Few-Shot Spoken Language Understanding via Joint Speech-Text Models},
  booktitle     = {2023 IEEE Automatic Speech Recognition and Understanding Workshop (ASRU)},
  year          = {2023},
  month         = dec,
  eprint        = {2310.05919},
  archiveprefix = {arXiv},
  primaryclass  = {cs.CL},
}
% doi holds the bare DOI only (no resolver prefix, no stray punctuation); it matches the identifier at the end of the url field.
@inproceedings{chou2023toward,
  author        = {Chou, Ju-Chieh and Chien, Chung-Ming and Hsu, Wei-Ning and Livescu, Karen and Babu, Arun and Conneau, Alexis and Baevski, Alexei and Auli, Michael},
  title         = {Toward Joint Language Modeling for Speech Units and Text},
  booktitle     = {Findings of the Association for Computational Linguistics: EMNLP 2023},
  pages         = {6582--6593},
  year          = {2023},
  month         = dec,
  doi           = {10.18653/v1/2023.findings-emnlp.438},
  url           = {https://aclanthology.org/2023.findings-emnlp.438},
  eprint        = {2310.08715},
  archiveprefix = {arXiv},
  primaryclass  = {cs.CL},
}
% The accented letter in the first surname is a braced special character so BibTeX treats it as a single letter for sorting and labels.
@inproceedings{gabrys2022voice,
  author        = {Gabry{\'s}, Adam and Huybrechts, Goeric and Ribeiro, Manuel Sam and Chien, Chung-Ming and Roth, Julian and Comini, Giulia and Barra-Chicote, Roberto and Perz, Bartek and Lorenzo-Trueba, Jaime},
  title         = {Voice Filter: Few-Shot Text-to-Speech Speaker Adaptation Using Voice Conversion as a Post-Processing Module},
  booktitle     = {ICASSP 2022 - 2022 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)},
  pages         = {7902--7906},
  year          = {2022},
  month         = may,
  doi           = {10.1109/ICASSP43922.2022.9747239},
  eprint        = {2202.08164},
  archiveprefix = {arXiv},
  primaryclass  = {eess.AS},
}
% The acronym in the title is brace-protected so sentence-casing styles do not down-case it.
@inproceedings{lin2021s2vc,
  author        = {Lin, Jheng-hao and Lin, Yist Y. and Chien, Chung-Ming and Lee, Hung-yi},
  title         = {{S2VC}: A Framework for Any-to-Any Voice Conversion with Self-Supervised Pretrained Representations},
  booktitle     = {Proc. Interspeech 2021},
  pages         = {836--840},
  year          = {2021},
  month         = aug,
  doi           = {10.21437/Interspeech.2021-1356},
  eprint        = {2104.02901},
  archiveprefix = {arXiv},
  primaryclass  = {eess.AS},
}
% Empty volume/number placeholders are omitted; empty fields only produce warnings and carry no data.
@inproceedings{chien2021investigating,
  author        = {Chien, Chung-Ming and Lin, Jheng-Hao and Huang, Chien-yu and Hsu, Po-chun and Lee, Hung-yi},
  title         = {Investigating on Incorporating Pretrained and Learnable Speaker Representations for Multi-Speaker Multi-Style Text-to-Speech},
  booktitle     = {ICASSP 2021 - 2021 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)},
  pages         = {8588--8592},
  year          = {2021},
  month         = jun,
  doi           = {10.1109/ICASSP39728.2021.9413880},
  eprint        = {2103.04088},
  archiveprefix = {arXiv},
  primaryclass  = {eess.AS},
}
% NOTE(review): the asterisks on the first two surnames are kept as-is; they look like equal-contribution marks (confirm), and they become part of the parsed last name, which affects sorting and labels.
% The system name in the title is brace-protected so sentence-casing styles keep its capitalisation.
@inproceedings{chien2020fragmentvc,
  author        = {Chien*, Chung-Ming and Lin*, Yist Y. and Lin, Jheng-Hao and Lee, Hung-yi and Lee, Lin-shan},
  title         = {{FragmentVC}: Any-To-Any Voice Conversion by End-To-End Extracting and Fusing Fine-Grained Voice Fragments with Attention},
  booktitle     = {ICASSP 2021 - 2021 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)},
  pages         = {5939--5943},
  year          = {2021},
  month         = jun,
  doi           = {10.1109/ICASSP39728.2021.9413699},
  eprint        = {2010.14150},
  archiveprefix = {arXiv},
  primaryclass  = {eess.AS},
}