Repository for the paper "Language Models can Self-Improve at State-Value Estimation for Better Search".
Code and data coming soon!
@misc{mendes2025languagemodelsselfimprovestatevalue,
  author        = {Ethan Mendes and Alan Ritter},
  title         = {Language Models can Self-Improve at State-Value Estimation for Better Search},
  year          = {2025},
  eprint        = {2503.02878},
  archivePrefix = {arXiv},
  primaryClass  = {cs.LG},
  url           = {https://arxiv.org/abs/2503.02878},
}