2024 The 2023 International Planning Competition Ayal Taitler, Ron Alford, Joan Espasa, Gregor Behnke, Daniel Fišer, Michael Gimelfarb, Florian Pommerening, Scott Sanner, Enrico Scala, Dominik Schreiber, and others AI Magazine, 2024 Bib HTML PDF @article{taitler20242023, title = {The 2023 International Planning Competition}, author = {Taitler, Ayal and Alford, Ron and Espasa, Joan and Behnke, Gregor and Fi{\v{s}}er, Daniel and Gimelfarb, Michael and Pommerening, Florian and Sanner, Scott and Scala, Enrico and Schreiber, Dominik and others}, journal = {AI Magazine}, year = {2024}, } JaxPlan and GurobiPlan: Optimization Baselines for Replanning in Discrete and Mixed Discrete-Continuous Probabilistic Domains Michael Gimelfarb, Ayal Taitler, and Scott Sanner In Proceedings of the International Conference on Automated Planning and Scheduling, 2024 Bib HTML PDF Code @inproceedings{gimelfarb2024jaxplan, title = {JaxPlan and GurobiPlan: Optimization Baselines for Replanning in Discrete and Mixed Discrete-Continuous Probabilistic Domains}, author = {Gimelfarb, Michael and Taitler, Ayal and Sanner, Scott}, booktitle = {Proceedings of the International Conference on Automated Planning and Scheduling}, year = {2024}, } Constraint-Generation Policy Optimization (CGPO): Nonlinear Programming for Policy Optimization in Mixed Discrete-Continuous MDPs Michael Gimelfarb, Ayal Taitler, and Scott Sanner arXiv preprint, 2024 HTML PDF ModelDiff: Leveraging Models for Policy Transfer with Value Lower Bounds Xiaotian Liu, Jihwan Jeong, Ayal Taitler, Michael Gimelfarb, and Scott Sanner In PRL Workshop Series: Bridging the Gap Between AI Planning and Reinforcement Learning, 2024 Bib HTML PDF @inproceedings{liu2024modeldiff, title = {ModelDiff: Leveraging Models for Policy Transfer with Value Lower Bounds}, author = {Liu, Xiaotian and Jeong, Jihwan and Taitler, Ayal and Gimelfarb, Michael and Sanner, Scott}, booktitle = {PRL Workshop Series: Bridging the Gap Between AI Planning and Reinforcement Learning}, year = {2024}, } 2023 Conservative bayesian model-based value expansion for offline policy optimization Jihwan Jeong, Xiaoyu Wang, Michael Gimelfarb, Hyunwoo Kim, Baher Abdulhai, and Scott Sanner In International Conference on Learning Representations, 2023 Bib HTML PDF Code @inproceedings{jeong2023conservative, title = {Conservative bayesian model-based value expansion for offline policy optimization}, author = {Jeong, Jihwan and Wang, Xiaoyu and Gimelfarb, Michael and Kim, Hyunwoo and Abdulhai, Baher and Sanner, Scott}, booktitle = {International Conference on Learning Representations}, year = {2023}, } pyRDDLGym: From RDDL to Gym Environments Ayal Taitler, Michael Gimelfarb, Jihwan Jeong, Sriram Gopalakrishnan, Martin Mladenov, Xiaotian Liu, and Scott Sanner In PRL Workshop Series: Bridging the Gap Between AI Planning and Reinforcement Learning, 2023 Bib HTML PDF Code @inproceedings{taitler2023pyrddlgym, title = {pyRDDLGym: From RDDL to Gym Environments}, author = {Taitler, Ayal and Gimelfarb, Michael and Jeong, Jihwan and Gopalakrishnan, Sriram and Mladenov, Martin and Liu, Xiaotian and Sanner, Scott}, booktitle = {PRL Workshop Series: Bridging the Gap Between AI Planning and Reinforcement Learning}, year = {2023}, } Thompson Sampling for Parameterized Markov Decision Processes with Uninformative Actions Michael Gimelfarb, and Michael Jong Kim arXiv preprint arXiv:2305.07844, 2023 HTML PDF 2022 A Distributional Framework for Risk-Sensitive End-to-End Planning in Continuous MDPs Noah Patton, Jihwan Jeong, Michael Gimelfarb, and Scott Sanner In Proceedings of the AAAI Conference on Artificial Intelligence, 2022 Bib HTML PDF @inproceedings{patton2022distributional, title = {A Distributional Framework for Risk-Sensitive End-to-End Planning in Continuous MDPs}, author = {Patton, Noah and Jeong, Jihwan and Gimelfarb, Michael and Sanner, Scott}, booktitle = {Proceedings of the AAAI Conference on Artificial Intelligence}, year = {2022}, } 2021 Contextual policy transfer in reinforcement learning domains via deep mixtures-of-experts Michael Gimelfarb, Scott Sanner, and Chi-Guhn Lee In Uncertainty in Artificial Intelligence, 2021 Bib HTML PDF @inproceedings{gimelfarb2021contextual, title = {Contextual policy transfer in reinforcement learning domains via deep mixtures-of-experts}, author = {Gimelfarb, Michael and Sanner, Scott and Lee, Chi-Guhn}, booktitle = {Uncertainty in Artificial Intelligence}, year = {2021}, } Bayesian experience reuse for learning from multiple demonstrators Michael Gimelfarb, Scott Sanner, and Chi-Guhn Lee In International Joint Conference on Artificial Intelligence, 2021 Bib HTML PDF @inproceedings{gimelfarb2021bayesian, title = {Bayesian experience reuse for learning from multiple demonstrators}, author = {Gimelfarb, Michael and Sanner, Scott and Lee, Chi-Guhn}, booktitle = {International Joint Conference on Artificial Intelligence}, year = {2021}, } Risk-aware transfer in reinforcement learning using successor features Michael Gimelfarb , André Barreto, Scott Sanner, and Chi-Guhn Lee In Advances in Neural Information Processing Systems, 2021 Bib HTML PDF @inproceedings{gimelfarb2021risk, title = {Risk-aware transfer in reinforcement learning using successor features}, author = {Gimelfarb, Michael and Barreto, Andr{\'e} and Sanner, Scott and Lee, Chi-Guhn}, booktitle = {Advances in Neural Information Processing Systems}, year = {2021}, } 2020 Epsilon-BMC: A Bayesian Ensemble Approach to Epsilon-Greedy Exploration in Model-Free Reinforcement Learning Michael Gimelfarb, Scott Sanner, and Chi-Guhn Lee In Uncertainty in Artificial Intelligence, 2020 Bib HTML PDF Code @inproceedings{gimelfarb2020epsilon, title = {Epsilon-BMC: A Bayesian Ensemble Approach to Epsilon-Greedy Exploration in Model-Free Reinforcement Learning}, author = {Gimelfarb, Michael and Sanner, Scott and Lee, Chi-Guhn}, booktitle = {Uncertainty in Artificial Intelligence}, year = {2020}, } 2018 Reinforcement learning with multiple experts: A bayesian model combination approach Michael Gimelfarb, Scott Sanner, and Chi-Guhn Lee In Advances in neural information processing systems, 2018 Bib HTML PDF Code @inproceedings{gimelfarb2018reinforcement, title = {Reinforcement learning with multiple experts: A bayesian model combination approach}, author = {Gimelfarb, Michael and Sanner, Scott and Lee, Chi-Guhn}, booktitle = {Advances in neural information processing systems}, year = {2018}, }