<?xml version="1.0" encoding="US-ASCII"?>
<dblp>
<article key="journals/corr/abs-2410-16162" publtype="informal" mdate="2026-02-09">
<author>Yihong Tang</author>
<author>Ao Qu</author>
<author>Zhaokai Wang</author>
<author>Dingyi Zhuang</author>
<author>Zhaofeng Wu</author>
<author>Wei Ma</author>
<author>Shenhao Wang</author>
<author>Yunhan Zheng</author>
<author>Zhan Zhao</author>
<author>Jinhua Zhao 0001</author>
<title>Sparkle: Mastering Basic Spatial Capabilities in Vision Language Models Elicits Generalization to Composite Spatial Reasoning.</title>
<year>2024</year>
<volume>abs/2410.16162</volume>
<journal>CoRR</journal>
<ee type="oa">https://doi.org/10.48550/arXiv.2410.16162</ee>
<url>db/journals/corr/corr2410.html#abs-2410-16162</url>
<stream>streams/journals/corr</stream>
</article>
</dblp>
