{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,8]],"date-time":"2026-05-08T13:25:00Z","timestamp":1778246700299,"version":"3.51.4"},"reference-count":42,"publisher":"IEEE","license":[{"start":{"date-parts":[[2021,5,30]],"date-time":"2021-05-30T00:00:00Z","timestamp":1622332800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2021,5,30]],"date-time":"2021-05-30T00:00:00Z","timestamp":1622332800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2021,5,30]]},"DOI":"10.1109\/icra48506.2021.9561548","type":"proceedings-article","created":{"date-parts":[[2021,10,20]],"date-time":"2021-10-20T00:28:35Z","timestamp":1634689715000},"page":"6541-6548","source":"Crossref","is-referenced-by-count":66,"title":["Hierarchical Planning for Long-Horizon Manipulation with Geometric and Symbolic Scene Graphs"],"prefix":"10.1109","author":[{"given":"Yifeng","family":"Zhu","sequence":"first","affiliation":[{"name":"NVIDIA"}]},{"given":"Jonathan","family":"Tremblay","sequence":"additional","affiliation":[{"name":"NVIDIA"}]},{"given":"Stan","family":"Birchfield","sequence":"additional","affiliation":[{"name":"NVIDIA"}]},{"given":"Yuke","family":"Zhu","sequence":"additional","affiliation":[{"name":"NVIDIA"}]}],"member":"263","reference":[{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.1109\/LRA.2019.2894861"},{"key":"ref38","article-title":"Embed to control: A locally linear latent dynamics model for control from raw images","author":"watter","year":"2015","journal-title":"Advances in neural information processing systems"},{"key":"ref33","first-page":"1930","article-title":"Logic-geometric programming: An optimization-based approach to combined task and motion planning","author":"toussaint","year":"2015","journal-title":"IJCAI"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA.2014.6906922"},{"key":"ref31","first-page":"979","article-title":"Graph-structured visual imitation","author":"sieb","year":"2020","journal-title":"Conference on Robot Learning"},{"key":"ref30","article-title":"Fast uncertainty quantification for deep object pose estimation","author":"shi","year":"2021","journal-title":"International Conference on Robotics and Automation (ICRA)"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1109\/IROS.2018.8594027"},{"key":"ref36","article-title":"6-DoF pose estimation of household objects for robotic manipulation: An accessible dataset and benchmark","author":"tyree","year":"2019","journal-title":"ICCV Workshop on Recovering 6D Object Pose"},{"key":"ref35","article-title":"Deep object pose estimation for semantic robotic grasping of household objects","author":"tremblay","year":"2018","journal-title":"Conference on Robot Learning"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.15607\/RSS.2018.XIV.044"},{"key":"ref10","doi-asserted-by":"crossref","first-page":"440","DOI":"10.1609\/icaps.v30i1.6739","article-title":"Pddlstream: Integrating symbolic planners and blackbox samplers via optimistic adaptive planning","volume":"30","author":"garrett","year":"2020","journal-title":"Proceedings of the International Conference on Automated Planning and Scheduling"},{"key":"ref40","first-page":"1317","article-title":"Regression planning networks","author":"xu","year":"2019","journal-title":"Advances in neural information processing systems"},{"key":"ref11","article-title":"Dream to control: Learning behaviors by latent imagination","author":"hafner","year":"2019","journal-title":"International Conference on Learning Representations"},{"key":"ref12","first-page":"2555","article-title":"Learning latent dynamics for planning from pixels","author":"hafner","year":"2019","journal-title":"International Conference on Machine Learning"},{"key":"ref13","article-title":"Relational inductive bias for physical construction in humans and machines","author":"hamrick","year":"2018"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA40945.2020.9197172"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/IROS40897.2019.8967761"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA.2011.5980391"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1177\/0278364919848837"},{"key":"ref18","article-title":"Contrastive learning of structured world models","author":"kipf","year":"2019","journal-title":"International Conference on Learning Representations"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1007\/s11263-016-0981-7"},{"key":"ref28","article-title":"Long-horizon visual planning with goal-conditioned hierarchical predictors","author":"pertsch","year":"2020"},{"key":"ref4","article-title":"Discovering symbolic models from deep learning with inductive biases","author":"cranmer","year":"2020"},{"key":"ref27","first-page":"2863","article-title":"Action-conditional video prediction using deep networks in atari games","author":"oh","year":"2015","journal-title":"Advances in neural information processing systems"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA.2016.7487165"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.15607\/RSS.2020.XVI.003"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.15607\/RSS.2020.XVI.079"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.15607\/RSS.2016.XII.002"},{"key":"ref8","article-title":"Dynamics learning with cascaded variational inference for multi-step manipulation","author":"fang","year":"2019","journal-title":"Conference on Robot Learning (CoRL)"},{"key":"ref7","article-title":"GENESIS: Generative scene inference and sampling with object-centric latent representations","author":"engelcke","year":"2020","journal-title":"International Conference on Learning Representations (ICLR)"},{"key":"ref2","article-title":"MONet: Unsupervised scene decomposition and representation","author":"burgess","year":"2019"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA.2017.7989324"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00576"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1017\/CBO9780511546877"},{"key":"ref22","article-title":"Learning latent plans from play","author":"lynch","year":"2020","journal-title":"Conference on Robot Learning"},{"key":"ref21","article-title":"Space: Unsupervised object-oriented scene representation via spatial attention and decomposition","author":"lin","year":"2020","journal-title":"International Conference on Learning Representations"},{"key":"ref42","article-title":"Object-centric forward modeling for model predictive control","author":"ye","year":"2019","journal-title":"Conference on Robot Learning (CoRL)"},{"key":"ref24","author":"morrical","year":"2020","journal-title":"NVISII Nvidia scene imaging interface"},{"key":"ref41","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.330"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/LRA.2020.2965875"},{"key":"ref26","article-title":"Planning with goal-conditioned policies","author":"nasiriany","year":"2019","journal-title":"Advances in neural information processing systems"},{"key":"ref25","article-title":"Hierarchical foresight: Self-supervised learning of long-horizon tasks via visual subgoal generation","author":"nair","year":"2019","journal-title":"International Conference on Learning Representations"}],"event":{"name":"2021 IEEE International Conference on Robotics and Automation (ICRA)","location":"Xi'an, China","start":{"date-parts":[[2021,5,30]]},"end":{"date-parts":[[2021,6,5]]}},"container-title":["2021 IEEE International Conference on Robotics and Automation (ICRA)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/9560720\/9560666\/09561548.pdf?arnumber=9561548","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,1,12]],"date-time":"2023-01-12T22:54:20Z","timestamp":1673564060000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9561548\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021,5,30]]},"references-count":42,"URL":"https:\/\/doi.org\/10.1109\/icra48506.2021.9561548","relation":{},"subject":[],"published":{"date-parts":[[2021,5,30]]}}}