% Conference paper in the 15th Asian Conference on Machine Learning proceedings (PMLR volume 222).
% The acronym MDPs is brace-protected so sentence-casing styles keep it uppercase.
% The month value is kept verbatim as free text (a day range, not a month macro).
@inproceedings{saber_pesquerel_log_regret_mdp_2024,
  author    = {Saber, Hassan and Pesquerel, Fabien and Maillard, Odalric-Ambrym and Talebi, Mohammad Sadegh},
  title     = {Logarithmic regret in communicating {MDPs}: Leveraging known dynamics with bandits},
  booktitle = {Proceedings of the 15th Asian Conference on Machine Learning},
  editor    = {Yanıkoğlu, Berrin and Buntine, Wray},
  series    = {Proceedings of Machine Learning Research},
  volume    = {222},
  pages     = {1167--1182},
  publisher = {PMLR},
  month     = {11--14 Nov},
  year      = {2024},
  url       = {https://proceedings.mlr.press/v222/saber24a.html},
}
% Conference paper, Advances in Neural Information Processing Systems, volume 36.
@inproceedings{pesquerel_fast_imed_fimed_2023,
  title     = {Fast Asymptotically Optimal Algorithms for Non-Parametric Stochastic Bandits},
  author    = {Baudry, Dorian and Pesquerel, Fabien and Degenne, Rémy and Maillard, Odalric-Ambrym},
  booktitle = {Advances in Neural Information Processing Systems},
  editor    = {Oh, A. and Naumann, T. and Globerson, A. and Saenko, K. and Hardt, M. and Levine, S.},
  volume    = {36},
  pages     = {11469--11514},
  publisher = {Curran Associates, Inc.},
  year      = {2023},
  url       = {https://proceedings.neurips.cc/paper_files/paper/2023/file/26300457961c3e056ea61c9d3ebec2a4-Paper-Conference.pdf},
}
PhD thesis
Information per unit of interaction in stochastic sequential decision making
% Doctoral thesis, so the phdthesis entry type is used instead of book
% (book would require a publisher and renders the work as a monograph).
% NOTE(review): the school is not stated in this file; it is presumed from
% the HAL thesis record linked in the url field -- confirm before publishing.
@phdthesis{pesquerel_phd_thesis_information_per_unit_of_interaction_2023,
  author = {Pesquerel, Fabien},
  title  = {Information per unit of interaction in stochastic sequential decision making},
  school = {Université de Lille},
  month  = dec,
  year   = {2023},
  url    = {https://cnrs.hal.science/tel-04501905/},
}
% Conference paper, Advances in Neural Information Processing Systems, volume 35.
% The algorithm name IMED-RL and the proper noun Markov are brace-protected so
% sentence-casing styles do not lowercase them.
@inproceedings{pesquerel_imedrl_2022,
  author    = {Pesquerel, Fabien and Maillard, Odalric-Ambrym},
  title     = {{IMED-RL}: Regret optimal learning of ergodic {Markov} decision processes},
  booktitle = {Advances in Neural Information Processing Systems},
  editor    = {Koyejo, S. and Mohamed, S. and Agarwal, A. and Belgrave, D. and Cho, K. and Oh, A.},
  volume    = {35},
  pages     = {26363--26374},
  publisher = {Curran Associates, Inc.},
  year      = {2022},
  url       = {https://proceedings.neurips.cc/paper_files/paper/2022/file/a8c9f9ccc45771d2fd06bcd04ff3442e-Paper-Conference.pdf},
}
% Conference paper, Advances in Neural Information Processing Systems, volume 34.
% The title carries no trailing period: terminal punctuation is supplied by the
% bibliography style. Editor initials are space-separated so they parse as
% separate name tokens.
@inproceedings{pesquerel_bandits_group_similar_arms_2021,
  author    = {Pesquerel, Fabien and Saber, Hassan and Maillard, Odalric-Ambrym},
  title     = {Stochastic bandits with groups of similar arms},
  booktitle = {Advances in Neural Information Processing Systems},
  editor    = {Ranzato, M. and Beygelzimer, A. and Dauphin, Y. and Liang, P. S. and Vaughan, J. Wortman},
  volume    = {34},
  pages     = {19461--19472},
  publisher = {Curran Associates, Inc.},
  year      = {2021},
  url       = {https://proceedings.neurips.cc/paper_files/paper/2021/file/a22c0238589078fb10b606ab62015744-Paper.pdf},
}