@inproceedings{bbbbd61d56eb4306a83086cf3033ae4b,
title = "STEP Planner: Constructing cross-hierarchical subgoal tree as an embodied long-horizon task planner",
abstract = "The ability to perform reliable long-horizon task planning is crucial for deploying robots in real-world environments. However, directly employing Large Language Models (LLMs) as action sequence generators often results in low success rates due to their limited reasoning ability for long-horizon embodied tasks. In the STEP framework, we construct a subgoal tree through a pair of closed-loop models: a subgoal decomposition model and a leaf node termination model. Within this framework, we develop a hierarchical tree structure that spans from coarse to fine resolutions. The subgoal decomposition model leverages a foundation LLM to break down complex goals into manageable subgoals, thereby spanning the subgoal tree. The leaf node termination model provides real-time feedback based on environmental states, determining when to terminate the tree spanning and ensuring each leaf node can be directly converted into a primitive action. Experiments conducted in both the VirtualHome WAH-NL benchmark and on real robots demonstrate that STEP achieves long-horizon embodied task completion with success rates up to 34\% (WAH-NL) and 25\% (real robot) outperforming SOTA methods.",
author = "Tianxing Zhou and Zhirui Wang and Haojia Ao and Guangyan Chen and Boyang Xing and Jingwen Cheng and Yi Yang and Yufeng Yue",
note = "Publisher Copyright: {\textcopyright} 2025 IEEE.; 2025 IEEE/RSJ International Conference on Intelligent Robots and Systems, IROS 2025 ; Conference date: 19-10-2025 Through 25-10-2025",
year = "2025",
doi = "10.1109/IROS60139.2025.11246104",
language = "English",
series = "IEEE International Conference on Intelligent Robots and Systems",
publisher = "Institute of Electrical and Electronics Engineers Inc.",
pages = "16731--16738",
editor = "Christian Laugier and Alessandro Renzaglia and Nikolay Atanasov and Stan Birchfield and Grzegorz Cielniak and \{De Mattos\}, Leonardo and Laura Fiorini and Philippe Giguere and Kenji Hashimoto and Javier Ibanez-Guzman and Tetsushi Kamegawa and Jinoh Lee and Giuseppe Loianno and Kevin Luck and Hisataka Maruyama and Philippe Martinet and Hadi Moradi and Urbano Nunes and Julien Pettre and Alberto Pretto and Tommaso Ranzani and Arne Ronnau and Silvia Rossi and Elliott Rouse and Fabio Ruggiero and Olivier Simonin and Danwei Wang and Ming Yang and Eiichi Yoshida and Huijing Zhao",
booktitle = "IROS 2025 - 2025 IEEE/RSJ International Conference on Intelligent Robots and Systems, Conference Proceedings",
address = "United States",
}