Varun Dhanraj and Chris Eliasmith. Improving reasoning and planning capabilities of language models using reinforcement learning. In Mediterranean Machine Learning Summer School 2024. 2024.
% The non-standard "poster" field below holds the link to the PDF; standard BibTeX styles ignore unknown fields.
@inproceedings{dhanraj2024,
  author    = {Varun Dhanraj and Chris Eliasmith},
  title     = {Improving Reasoning and Planning Capabilities of Language Models using Reinforcement Learning},
  booktitle = {Mediterranean Machine Learning Summer School 2024},
  year      = {2024},
  poster    = {http://compneuro.uwaterloo.ca/files/Dhanraj_Milan_2024.pdf},
}