@inproceedings{wataru24apsipa_necobert,
  author         = {Nakata, Wataru and Saeki, Takaaki and Saito, Yuki and Takamichi, Shinnosuke and Saruwatari, Hiroshi},
  title          = {{NecoBERT}: Self-Supervised Learning Model Trained by Masked Language Modeling on Rich Acoustic Features Derived from Neural Audio Codec},
  booktitle      = {Asia Pacific Signal and Information Processing Association Annual Summit and Conference (APSIPA ASC)},
  year           = {2024},
  abbr_publisher = {Asia Pacific Signal and Information Processing Association Annual Summit and Conference (APSIPA ASC)},
}
Real-Time Noise Estimation for Lombard-Effect Speech Synthesis in Human–Avatar Dialogue Systems
@inproceedings{ishikawa24apsipa_lombard,
  author         = {Ishikawa, Yuto and Take, Osamu and Nakamura, Tomohiko and Takamune, Norihiro and Saito, Yuki and Takamichi, Shinnosuke and Saruwatari, Hiroshi},
  title          = {Real-Time Noise Estimation for {Lombard}-Effect Speech Synthesis in Human–Avatar Dialogue Systems},
  booktitle      = {Asia Pacific Signal and Information Processing Association Annual Summit and Conference (APSIPA ASC)},
  year           = {2024},
  abbr_publisher = {Asia Pacific Signal and Information Processing Association Annual Summit and Conference (APSIPA ASC)},
}