Publications

More information is available on my Google Scholar profile.

2025

Stable Offline Value Function Learning with Bisimulation-based Representations
Brahma S. Pavse, Yudong Chen, Qiaomin Xie, Josiah P. Hanna
Proceedings of the 42nd International Conference on Machine Learning (ICML), 2025

PDF Cite

@inproceedings{pavse2025stable,
  author        = {Pavse, Brahma S. and Chen, Yudong and Xie, Qiaomin and Hanna, Josiah P.},
  title         = {Stable Offline Value Function Learning with Bisimulation-based Representations},
  booktitle     = {Proceedings of the 42nd International Conference on Machine Learning (ICML)},
  year          = {2025},
  month         = jul,
  eprint        = {2410.01643},
  archiveprefix = {arXiv},
  primaryclass  = {cs.LG},
  url           = {https://arxiv.org/abs/2410.01643},
}

2024

Learning to Stabilize Online Reinforcement Learning in Unbounded State Spaces
Brahma S. Pavse, Matthew Zurek, Yudong Chen, Qiaomin Xie, Josiah P. Hanna
Proceedings of the 41st International Conference on Machine Learning (ICML), 2024

PDF Code Cite

@inproceedings{pavse2024stabilize,
  author        = {Pavse, Brahma S. and Zurek, Matthew and Chen, Yudong and Xie, Qiaomin and Hanna, Josiah P.},
  title         = {Learning to Stabilize Online Reinforcement Learning in Unbounded State Spaces},
  booktitle     = {Proceedings of the 41st International Conference on Machine Learning (ICML)},
  year          = {2024},
  month         = jul,
  eprint        = {2306.01896},
  archiveprefix = {arXiv},
  primaryclass  = {cs.LG},
  url           = {https://arxiv.org/abs/2306.01896},
}

2023

Scaling Marginalized Importance Sampling to High-Dimensional State-Spaces via State Abstraction
Brahma S. Pavse, Josiah P. Hanna
Proceedings of the 37th AAAI Conference on Artificial Intelligence (AAAI), 2023

PDF Cite

@inproceedings{pavse2023absmis,
  author    = {Pavse, Brahma S. and Hanna, Josiah P.},
  title     = {Scaling Marginalized Importance Sampling to High-Dimensional State-Spaces via State Abstraction},
  booktitle = {Proceedings of the 37th AAAI Conference on Artificial Intelligence (AAAI)},
  address   = {Washington, DC, USA},
  year      = {2023},
  month     = feb,
  url       = {documents/papers/2023/pavse_2023_absmis.pdf},
}

State-Action Similarity-Based Representations for Off-Policy Evaluation
Brahma S. Pavse, Josiah P. Hanna
Advances in Neural Information Processing Systems (NeurIPS), 2023

PDF Code Cite

@inproceedings{pavse2023rope,
  author        = {Pavse, Brahma S. and Hanna, Josiah P.},
  title         = {State-Action Similarity-Based Representations for Off-Policy Evaluation},
  booktitle     = {Advances in Neural Information Processing Systems (NeurIPS)},
  year          = {2023},
  month         = dec,
  eprint        = {2310.18409},
  archiveprefix = {arXiv},
  primaryclass  = {cs.LG},
  url           = {https://arxiv.org/abs/2310.18409},
}

2020

Reinforced Inverse Dynamics Modeling for Learning from a Single Observed Demonstration
Brahma S. Pavse, Faraz Torabi, Josiah Hanna, Garrett Warnell, Peter Stone
IEEE Robotics and Automation Letters (RA-L); IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS), 2020

PDF DOI Cite

@article{pavse2020ridm,
  author  = {Pavse, Brahma S. and Torabi, Faraz and Hanna, Josiah and Warnell, Garrett and Stone, Peter},
  title   = {Reinforced Inverse Dynamics Modeling for Learning from a Single Observed Demonstration},
  journal = {IEEE Robotics and Automation Letters (RA-L)},
  year    = {2020},
  month   = jul,
  doi     = {10.1109/LRA.2020.3010750},
  url     = {documents/papers/2020/pavse_2020_ridm.pdf},
  note    = {Also presented at the IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)},
}

Reducing Sampling Error in Batch Temporal Difference Learning
Brahma S. Pavse, Ishan Durugkar, Josiah Hanna, Peter Stone
Proceedings of the 37th International Conference on Machine Learning (ICML), 2020

PDF Cite

@inproceedings{pavse2020psec,
  author    = {Pavse, Brahma S. and Durugkar, Ishan and Hanna, Josiah and Stone, Peter},
  title     = {Reducing Sampling Error in Batch Temporal Difference Learning},
  booktitle = {Proceedings of the 37th International Conference on Machine Learning (ICML)},
  year      = {2020},
  month     = jul,
  url       = {documents/papers/2020/pavse_2020_psec.pdf},
}

Reducing Sampling Error in Batch Temporal Difference Learning
Brahma S. Pavse
Master's Thesis, University of Texas at Austin, 2020

PDF Cite

@mastersthesis{pavse2020msthesis,
  author = {Pavse, Brahma S.},
  title  = {Reducing Sampling Error in Batch Temporal Difference Learning},
  school = {University of Texas at Austin},
  year   = {2020},
  month  = aug,
  url    = {documents/papers/2020/ms_thesis.pdf},
}

2019

Reinforced Inverse Dynamics Modeling for Learning from a Single Observed Demonstration
Brahma S. Pavse
Bachelor's Thesis, University of Texas at Austin, 2019

PDF Cite

@mastersthesis{pavse2019bsthesis,
  author = {Pavse, Brahma S.},
  title  = {Reinforced Inverse Dynamics Modeling for Learning from a Single Observed Demonstration},
  type   = {Bachelor's thesis},
  school = {University of Texas at Austin},
  year   = {2019},
  month  = may,
  url    = {documents/papers/2019/bs_honors_thesis.pdf},
}