% Conference paper by Moon, Park, and Song (2025); cite with key moon2025learning.
% NOTE(review): booktitle is stored as given; confirm whether the published
% proceedings title carries a longer form (e.g. an "Advances in" prefix).
@inproceedings{moon2025learning,
  author    = {Moon, Seungyong and Park, Bumsoo and Song, Hyun Oh},
  title     = {Learning to Better Search with Language Models via Guided Reinforced Self-Training},
  booktitle = {Neural Information Processing Systems},
  year      = {2025},
}