<?xml version="1.0" encoding="US-ASCII"?>
<dblp>
<article key="journals/corr/abs-2304-09116" publtype="informal" mdate="2025-10-27">
<author>Kai Shen</author>
<author>Zeqian Ju</author>
<author>Xu Tan 0003</author>
<author>Yanqing Liu</author>
<author>Yichong Leng</author>
<author>Lei He 0005</author>
<author>Tao Qin 0001</author>
<author>Sheng Zhao 0002</author>
<author>Jiang Bian 0002</author>
<title>NaturalSpeech 2: Latent Diffusion Models are Natural and Zero-Shot Speech and Singing Synthesizers.</title>
<year>2023</year>
<volume>abs/2304.09116</volume>
<journal>CoRR</journal>
<ee type="oa">https://doi.org/10.48550/arXiv.2304.09116</ee>
<url>db/journals/corr/corr2304.html#abs-2304-09116</url>
</article>
</dblp>
