Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

update publication #168

Merged
merged 1 commit into from
Sep 29, 2023
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
163 changes: 163 additions & 0 deletions _bibliography/papers.bib
Original file line number Diff line number Diff line change
Expand Up @@ -14,6 +14,169 @@ @string{WASPAA
% Venue macros: each expands to the full venue name followed by its acronym in parentheses.
@string{APSIPA  = {Asia Pacific Signal and Information Processing Association Annual Summit and Conference (APSIPA ASC)}}
@string{ICML    = {Proceedings of the International Conference on Machine Learning (ICML)}}
@string{ICLR    = {Proceedings of the International Conference on Learning Representations (ICLR)}}
@string{NeurIPS = {Proceedings of the Conference on Neural Information Processing Systems (NeurIPS)}}


% Conference paper; booktitle uses the ASRU venue macro, which must be defined earlier in this file.
@inproceedings{chou2023evaluating,
  author         = {Chou, Yi-Hui and Chang, Kalvin and Wu, Meng-Ju and Ou, Winston and Bi, Alice Wen-Hsin and Yang, Carol and Chen, Bryan Y. and Pai, Rong-Wei and Yeh, Po-Yen and Chiang, Jo-Peng and Phoann, Lu-Tshiann and Chang, Winnie and Cui, Chenxuan and Chen, Noel and Shi, Jiatong},
  title          = {Evaluating Self-supervised Speech Models on a Taiwanese Hokkien Corpus},
  booktitle      = ASRU,
  publisher      = {IEEE},
  year           = {2023},
  abbr           = {ASR},
  abbr_publisher = {ASRU},
}

@inproceedings{huang2023singing,
  author         = {Huang, Wen-Chin and Violeta, Lester Phillip and Liu, Songxiang and Shi, Jiatong and Toda, Tomoki},
  title          = {The Singing Voice Conversion Challenge 2023},
  booktitle      = ASRU,
  publisher      = {IEEE},
  year           = {2023},
  abbr           = {SVC},
  abbr_publisher = {ASRU},
}

% NOTE(review): the citation key spells "shiohara" while the first author is Shinohara;
% the key is left unchanged so existing citations and links keep resolving.
@inproceedings{shiohara2023domain,
  author         = {Shinohara, Yusuke and Watanabe, Shinji},
  title          = {Domain Adaptation by Data Distribution Matching via Submodularity for Speech Recognition},
  booktitle      = ASRU,
  publisher      = {IEEE},
  year           = {2023},
  abbr           = {ASR},
  abbr_publisher = {ASRU},
}

@inproceedings{kano2023summarize,
  author         = {Kano, Takatomo and Ogawa, Atsunori and Delcroix, Marc and Matsuura, Kohei and Ashihara, Takanori and Chen, William and Watanabe, Shinji},
  title          = {Summarize while Translating: Universal Model with Parallel Decoding for Summarization and Translation},
  booktitle      = ASRU,
  publisher      = {IEEE},
  year           = {2023},
  abbr           = {Summarization&ST},
  abbr_publisher = {ASRU},
}

@inproceedings{li2023yodas,
  author         = {Li, Xinjian and Takamichi, Shinnosuke and Saeki, Takaaki and Chen, William and Shiota, Sayaka and Watanabe, Shinji},
  title          = {YODAS: Youtube-Oriented Dataset for Audio and Speech},
  booktitle      = ASRU,
  publisher      = {IEEE},
  year           = {2023},
  abbr           = {ASR},
  abbr_publisher = {ASRU},
}

@inproceedings{kohei2023single,
  author         = {Saijo, Kohei and Zhang, Wangyou and Wang, Zhong-Qiu and Watanabe, Shinji and Kobayashi, Tetsunori and Ogawa, Tetsuji},
  title          = {A Single Speech Enhancement Model Unifying Dereverberation, Denoising, Speaker Counting, Separation, and Extraction},
  booktitle      = ASRU,
  publisher      = {IEEE},
  year           = {2023},
  abbr           = {SE&SS},
  abbr_publisher = {ASRU},
}

% NOTE(review): the citation key says "wang" while the first author is Hwang;
% the key is left unchanged so existing citations and links keep resolving.
@inproceedings{wang2023torchaudio,
  author         = {Hwang, Jeff and Hira, Moto and Chen, Caroline and Zhang, Xiaohui and Ni, Zhaoheng and Sun, Guangzhi and Ma, Pingchuan and Huang, Ruizhe and Pratap, Vineel and Zhang, Yuekai and Kumar, Anurag and Yu, Chin-Yun and Zhu, Chuang and Liu, Chunxi and Kahn, Jacob and Ravanelli, Mirco and Sun, Peng and Watanabe, Shinji and Shi, Yangyang and Tao, Yumeng},
  title          = {TorchAudio 2.1: Advancing speech recognition, self-supervised learning, and audio processing components for PyTorch},
  booktitle      = ASRU,
  publisher      = {IEEE},
  year           = {2023},
  abbr           = {ASR&SSL},
  abbr_publisher = {ASRU},
}

@inproceedings{zhang2023toward,
  author         = {Zhang, Wangyou and Saijo, Kohei and Wang, Zhong-Qiu and Watanabe, Shinji and Qian, Yanmin},
  title          = {Toward Universal Speech Enhancement For Diverse Input Conditions},
  booktitle      = ASRU,
  publisher      = {IEEE},
  year           = {2023},
  abbr           = {SE},
  abbr_publisher = {ASRU},
}

% Author names use the "Last, First" form: written as "ho lam Chung", the lowercase
% given name is parsed by BibTeX as a von-particle, leaving the author with no first name.
% NOTE(review): confirm the exact romanisation of this author against the published paper.
@inproceedings{shi2023findings,
  author         = {Shi, Jiatong and Chen, William and Berrebbi, Dan and Wang, Hsiu-Hsuan and Huang, Wei Ping and Hu, En Pei and Chung, Ho Lam and Chang, Xuankai and Tang, Yuxun and Li, Shang-Wen and Mohamed, Abdelrahman and Lee, Hung-yi and Watanabe, Shinji},
  title          = {Findings of the 2023 ML-SUPERB Challenge: Pre-Training and Evaluation over More Languages and Beyond},
  booktitle      = ASRU,
  publisher      = {IEEE},
  year           = {2023},
  abbr           = {ASR},
  abbr_publisher = {ASRU},
}

@inproceedings{chen2023joint,
  author         = {Chen, William and Shi, Jiatong and Yan, Brian and Berrebbi, Dan and Zhang, Wangyou and Peng, Yifan and Chang, Xuankai and Maiti, Soumi and Watanabe, Shinji},
  title          = {Joint Prediction and Denoising for Large-Scale Multilingual Self-Supervised Learning},
  booktitle      = ASRU,
  publisher      = {IEEE},
  year           = {2023},
  abbr           = {SSL},
  abbr_publisher = {ASRU},
}

@inproceedings{someki2023segment,
  author         = {Someki, Masao and Eng, Nicholas and Higuchi, Yosuke and Watanabe, Shinji},
  title          = {Segment-Level Vectorized Beam Search Based on Partially Autoregressive Inference},
  booktitle      = ASRU,
  publisher      = {IEEE},
  year           = {2023},
  abbr           = {ASR},
  abbr_publisher = {ASRU},
}

@inproceedings{peng2023reproducing,
  author         = {Peng, Yifan and Tian, Jinchuan and Yan, Brian and Berrebbi, Dan and Chang, Xuankai and Li, Xinjian and Shi, Jiatong and Arora, Siddhant and Chen, William and Sharma, Roshan and Zhang, Wangyou and Sudo, Yui and Shakeel, Muhammad and Jung, Jee-weon and Maiti, Soumi and Watanabe, Shinji},
  title          = {Reproducing Whisper-Style Training Using an Open-Source Toolkit and Publicly Available Data},
  booktitle      = ASRU,
  publisher      = {IEEE},
  year           = {2023},
  abbr           = {ASR&ST},
  abbr_publisher = {ASRU},
}

@inproceedings{roshan2023espnet,
  author         = {Sharma, Roshan and Chen, William and Kano, Takatomo and Sharma, Ruchira and Ogawa, Atsunori and Arora, Siddhant and Delcroix, Marc and Singh, Rita and Watanabe, Shinji and Raj, Bhiksha},
  title          = {ESPNet-SUMM: Introducing a novel large dataset, toolkit, and a cross-corpora evaluation of speech summarization systems},
  booktitle      = ASRU,
  publisher      = {IEEE},
  year           = {2023},
  abbr           = {Summarization},
  abbr_publisher = {ASRU},
}


@inproceedings{fujita2023lvctc,
  author         = {Fujita, Yuya and Watanabe, Shinji and Chang, Xuankai and Maekaku, Takashi},
  title          = {LV-CTC: Non-autoregressive ASR with CTC and latent variable models},
  booktitle      = ASRU,
  publisher      = {IEEE},
  year           = {2023},
  abbr           = {ASR},
  abbr_publisher = {ASRU},
}

@inproceedings{wang2023unssor,
  author         = {Wang, Zhong-Qiu and Watanabe, Shinji},
  title          = {UNSSOR: Unsupervised Neural Speech Separation by Leveraging Over-determined Training Mixtures},
  booktitle      = NeurIPS,
  year           = {2023},
  abbr           = {SS},
  abbr_publisher = {NeurIPS},
}

@inproceedings{masuyama2023exploring,
  author         = {Masuyama, Yoshiki and Chang, Xuankai and Zhang, Wangyou and Cornell, Samuele and Wang, Zhong-Qiu and Ono, Nobutaka and Qian, Yanmin and Watanabe, Shinji},
  title          = {Exploring the Integration of Speech Separation and Recognition with Self-Supervised Learning Representation},
  booktitle      = WASPAA,
  year           = {2023},
  abbr           = {SS},
  abbr_publisher = {WASPAA},
}


@article{maciejewski2023adilemma,
abbr={SS},
Expand Down
Loading
Loading