<?xml version="1.0" encoding="US-ASCII"?>
<dblp>
<article key="journals/corr/abs-2512-05126" publtype="informal" mdate="2026-04-07">
<author>Kaidi Wang</author>
<author>Yi He</author>
<author>Wenhao Guan</author>
<author>Weijie Wu</author>
<author>Hongwu Ding</author>
<author>Xiong Zhang</author>
<author>Di Wu</author>
<author orcid="0009-0004-2839-6286">Meng Meng</author>
<author>Jian Luan 0001</author>
<author>Lin Li</author>
<author>Qingyang Hong</author>
<title>SyncVoice: Towards Video Dubbing with Vision-Augmented Pretrained TTS Model.</title>
<year>2025</year>
<month>December</month>
<volume>abs/2512.05126</volume>
<journal>CoRR</journal>
<ee type="oa">https://doi.org/10.48550/arXiv.2512.05126</ee>
<url>db/journals/corr/corr2512.html#abs-2512-05126</url>
<stream>streams/journals/corr</stream>
</article>
</dblp>
