% ICML 2025 conference paper, with an arXiv preprint (2410.01643).
@inproceedings{pavse2025stable,
  author        = {Brahma S. Pavse and Yudong Chen and Qiaomin Xie and Josiah P. Hanna},
  title         = {Stable Offline Value Function Learning with Bisimulation-based Representations},
  booktitle     = {Proceedings of the 42nd International Conference on Machine Learning (ICML)},
  year          = {2025},
  month         = {July},
  eprint        = {2410.01643},
  archiveprefix = {arXiv},
  primaryclass  = {cs.LG},
  url           = {https://arxiv.org/abs/2410.01643},
}
% ICML 2024 conference paper, with an arXiv preprint (2306.01896).
@inproceedings{pavse2024stabilize,
  author        = {Brahma S. Pavse and Matthew Zurek and Yudong Chen and Qiaomin Xie and Josiah P. Hanna},
  title         = {Learning to Stabilize Online Reinforcement Learning in Unbounded State Spaces},
  booktitle     = {Proceedings of the 41st International Conference on Machine Learning (ICML)},
  year          = {2024},
  month         = {July},
  eprint        = {2306.01896},
  archiveprefix = {arXiv},
  primaryclass  = {cs.LG},
  url           = {https://arxiv.org/abs/2306.01896},
}
% AAAI 2023 conference paper; the url field is a relative path to a PDF file.
@inproceedings{pavse2023absmis,
  author    = {Brahma S. Pavse and Josiah P. Hanna},
  title     = {Scaling Marginalized Importance Sampling to High-Dimensional State-Spaces via State Abstraction},
  booktitle = {Proceedings of the 37th AAAI Conference on Artificial Intelligence (AAAI)},
  address   = {Washington, DC, USA},
  year      = {2023},
  month     = {February},
  url       = {documents/papers/2023/pavse_2023_absmis.pdf},
}
% NeurIPS 2023 conference paper, with an arXiv preprint (2310.18409).
@inproceedings{pavse2023rope,
  author        = {Brahma S. Pavse and Josiah P. Hanna},
  title         = {State-Action Similarity-Based Representations for Off-Policy Evaluation},
  booktitle     = {Advances in Neural Information Processing Systems (NeurIPS)},
  year          = {2023},
  month         = {December},
  eprint        = {2310.18409},
  archiveprefix = {arXiv},
  primaryclass  = {cs.LG},
  url           = {https://arxiv.org/abs/2310.18409},
}
% Journal article (DOI 10.1109/LRA.2020.3010750).
% The journal field holds only the journal name. The associated conference is
% recorded in the note field rather than in journal, so that bibliography
% styles do not print a conference name as part of the journal title.
@article{pavse2020ridm,
  author  = {Brahma S. Pavse and Faraz Torabi and Josiah Hanna and Garrett Warnell and Peter Stone},
  title   = {Reinforced Inverse Dynamics Modeling for Learning from a Single Observed Demonstration},
  journal = {IEEE Robotics and Automation Letters (RA-L)},
  year    = {2020},
  month   = {July},
  doi     = {10.1109/LRA.2020.3010750},
  url     = {documents/papers/2020/pavse_2020_ridm.pdf},
  note    = {Also presented at the IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)},
}
% ICML 2020 conference paper; the url field is a relative path to a PDF file.
@inproceedings{pavse2020psec,
  author    = {Brahma S. Pavse and Ishan Durugkar and Josiah Hanna and Peter Stone},
  title     = {Reducing Sampling Error in Batch Temporal Difference Learning},
  booktitle = {Proceedings of the 37th International Conference on Machine Learning (ICML)},
  year      = {2020},
  month     = {July},
  url       = {documents/papers/2020/pavse_2020_psec.pdf},
}
% Master's thesis (2020); the url field is a relative path to a PDF file.
@mastersthesis{pavse2020msthesis,
  author = {Brahma S. Pavse},
  title  = {Reducing Sampling Error in Batch Temporal Difference Learning},
  school = {University of Texas at Austin},
  year   = {2020},
  month  = {August},
  url    = {documents/papers/2020/ms_thesis.pdf},
}
% Bachelor's thesis (2019); the url field is a relative path to a PDF file.
% Encoded with the standard mastersthesis entry type plus a type override,
% because the standard BibTeX styles define no bachelor's-thesis entry type.
% The type field supplies the thesis label that styles print.
% NOTE(review): if a site generator groups entries by entry type, confirm it
% honours the type field before relying on this entry's grouping.
@mastersthesis{pavse2019bsthesis,
  author = {Brahma S. Pavse},
  title  = {Reinforced Inverse Dynamics Modeling for Learning from a Single Observed Demonstration},
  school = {University of Texas at Austin},
  type   = {Bachelor's Thesis},
  year   = {2019},
  month  = {May},
  url    = {documents/papers/2019/bs_honors_thesis.pdf},
}