% Publication list. The lines starting with a percent sign reproduce the text
% of the rendered publications page that accompanied each record; they sit
% outside every entry, so BibTeX ignores them.

% ---------------------------------------------------------------------------
% 2024 ACML Logarithmic regret in communicating MDPs: Leveraging known dynamics with bandits
% Hassan Saber, Fabien Pesquerel, Odalric-Ambrym Maillard, and 1 more author
% In Proceedings of the 15th Asian Conference on Machine Learning, 11–14 nov 2024
% Bib HTML PDF
@inproceedings{saber_pesquerel_log_regret_mdp_2024,
  author    = {Saber, Hassan and Pesquerel, Fabien and Maillard, Odalric-Ambrym and Talebi, Mohammad Sadegh},
  title     = {Logarithmic regret in communicating {MDPs}: Leveraging known dynamics with bandits},
  booktitle = {Proceedings of the 15th Asian Conference on Machine Learning},
  editor    = {Yanıkoğlu, Berrin and Buntine, Wray},
  series    = {Proceedings of Machine Learning Research},
  volume    = {222},
  pages     = {1167--1182},
  publisher = {PMLR},
  year      = {2024},
  month     = nov,
  url       = {https://proceedings.mlr.press/v222/saber24a.html},
}

% ---------------------------------------------------------------------------
% 2023 NeurIPS Fast Asymptotically Optimal Algorithms for Non-Parametric Stochastic Bandits
% Dorian Baudry, Fabien Pesquerel, Rémy Degenne, and 1 more author
% In Advances in Neural Information Processing Systems, 11–14 nov 2023
% Bib HTML PDF
% NOTE(review): this record has no month field; the "11–14 nov" shown above
% repeats the date range displayed for the preceding ACML item, presumably a
% rendering carry-over. Confirm before relying on it.
@inproceedings{pesquerel_fast_imed_fimed_2023,
  author    = {Baudry, Dorian and Pesquerel, Fabien and Degenne, Rémy and Maillard, Odalric-Ambrym},
  title     = {Fast Asymptotically Optimal Algorithms for Non-Parametric Stochastic Bandits},
  booktitle = {Advances in Neural Information Processing Systems},
  editor    = {Oh, A. and Naumann, T. and Globerson, A. and Saenko, K. and Hardt, M. and Levine, S.},
  volume    = {36},
  pages     = {11469--11514},
  publisher = {Curran Associates, Inc.},
  year      = {2023},
  url       = {https://proceedings.neurips.cc/paper_files/paper/2023/file/26300457961c3e056ea61c9d3ebec2a4-Paper-Conference.pdf},
}

% ---------------------------------------------------------------------------
% PhD thesis Information per unit of interaction in stochastic sequential decision making
% Fabien Pesquerel
% Dec 2023
% Bib HTML PDF
% NOTE(review): previously typed as a book; a thesis needs the phdthesis type,
% which requires a school. The school below was not part of the original
% record. Confirm it against the HAL page given in the url field.
@phdthesis{pesquerel_phd_thesis_information_per_unit_of_interaction_2023,
  author = {Pesquerel, Fabien},
  title  = {Information per unit of interaction in stochastic sequential decision making},
  school = {Université de Lille},
  year   = {2023},
  month  = dec,
  url    = {https://cnrs.hal.science/tel-04501905/},
}

% ---------------------------------------------------------------------------
% 2022 NeurIPS IMED-RL: Regret optimal learning of ergodic Markov decision processes
% Fabien Pesquerel, and Odalric-Ambrym Maillard
% In Advances in Neural Information Processing Systems, Dec 2022
% Bib HTML PDF
@inproceedings{pesquerel_imedrl_2022,
  author    = {Pesquerel, Fabien and Maillard, Odalric-Ambrym},
  title     = {{IMED-RL}: Regret optimal learning of ergodic {Markov} decision processes},
  booktitle = {Advances in Neural Information Processing Systems},
  editor    = {Koyejo, S. and Mohamed, S. and Agarwal, A. and Belgrave, D. and Cho, K. and Oh, A.},
  volume    = {35},
  pages     = {26363--26374},
  publisher = {Curran Associates, Inc.},
  year      = {2022},
  url       = {https://proceedings.neurips.cc/paper_files/paper/2022/file/a8c9f9ccc45771d2fd06bcd04ff3442e-Paper-Conference.pdf},
}

% ---------------------------------------------------------------------------
% 2021 NeurIPS Stochastic bandits with groups of similar arms.
% Fabien Pesquerel, Hassan Saber, and Odalric-Ambrym Maillard
% In Advances in Neural Information Processing Systems, Dec 2021
% Bib HTML PDF
@inproceedings{pesquerel_bandits_group_similar_arms_2021,
  author    = {Pesquerel, Fabien and Saber, Hassan and Maillard, Odalric-Ambrym},
  title     = {Stochastic bandits with groups of similar arms},
  booktitle = {Advances in Neural Information Processing Systems},
  editor    = {Ranzato, M. and Beygelzimer, A. and Dauphin, Y. and Liang, P. S. and Vaughan, J. Wortman},
  volume    = {34},
  pages     = {19461--19472},
  publisher = {Curran Associates, Inc.},
  year      = {2021},
  url       = {https://proceedings.neurips.cc/paper_files/paper/2021/file/a22c0238589078fb10b606ab62015744-Paper.pdf},
}