publications | Fabien Pesquerel

2024

Logarithmic regret in communicating MDPs: Leveraging known dynamics with bandits

Hassan Saber, Fabien Pesquerel, Odalric-Ambrym Maillard, and 1 more author

In Proceedings of the 15th Asian Conference on Machine Learning, 11–14 Nov 2024

@inproceedings{saber_pesquerel_log_regret_mdp_2024,
  title     = {Logarithmic regret in communicating {MDPs}: Leveraging known dynamics with bandits},
  author    = {Saber, Hassan and Pesquerel, Fabien and Maillard, Odalric-Ambrym and Talebi, Mohammad Sadegh},
  booktitle = {Proceedings of the 15th Asian Conference on Machine Learning},
  pages     = {1167--1182},
  year      = {2024},
  editor    = {Yanıkoğlu, Berrin and Buntine, Wray},
  volume    = {222},
  series    = {Proceedings of Machine Learning Research},
  month     = {11--14 Nov},
  publisher = {PMLR},
  url       = {https://proceedings.mlr.press/v222/saber24a.html}
}

2023

NeurIPS

Fast Asymptotically Optimal Algorithms for Non-Parametric Stochastic Bandits

Dorian Baudry, Fabien Pesquerel, Rémy Degenne, and 1 more author

In Advances in Neural Information Processing Systems, Dec 2023

Bib HTML PDF

@inproceedings{pesquerel_fast_imed_fimed_2023,
  author    = {Baudry, Dorian and Pesquerel, Fabien and Degenne, Rémy and Maillard, Odalric-Ambrym},
  title     = {Fast Asymptotically Optimal Algorithms for Non-Parametric Stochastic Bandits},
  booktitle = {Advances in Neural Information Processing Systems},
  editor    = {Oh, A. and Naumann, T. and Globerson, A. and Saenko, K. and Hardt, M. and Levine, S.},
  volume    = {36},
  pages     = {11469--11514},
  publisher = {Curran Associates, Inc.},
  year      = {2023},
  url       = {https://proceedings.neurips.cc/paper_files/paper/2023/file/26300457961c3e056ea61c9d3ebec2a4-Paper-Conference.pdf}
}

PhD thesis

Information per unit of interaction in stochastic sequential decision making

Fabien Pesquerel

Dec 2023

Bib HTML PDF

@phdthesis{pesquerel_phd_thesis_information_per_unit_of_interaction_2023,
  title  = {Information per unit of interaction in stochastic sequential decision making},
  author = {Pesquerel, Fabien},
  school = {Université de Lille},
  year   = {2023},
  month  = dec,
  url    = {https://cnrs.hal.science/tel-04501905/},
}

2022

NeurIPS

IMED-RL: Regret optimal learning of ergodic Markov decision processes

Fabien Pesquerel and Odalric-Ambrym Maillard

In Advances in Neural Information Processing Systems, Dec 2022

Bib HTML PDF

@inproceedings{pesquerel_imedrl_2022,
  author    = {Pesquerel, Fabien and Maillard, Odalric-Ambrym},
  booktitle = {Advances in Neural Information Processing Systems},
  editor    = {Koyejo, S. and Mohamed, S. and Agarwal, A. and Belgrave, D. and Cho, K. and Oh, A.},
  pages     = {26363--26374},
  publisher = {Curran Associates, Inc.},
  title     = {{IMED-RL}: Regret optimal learning of ergodic {Markov} decision processes},
  url       = {https://proceedings.neurips.cc/paper_files/paper/2022/file/a8c9f9ccc45771d2fd06bcd04ff3442e-Paper-Conference.pdf},
  volume    = {35},
  year      = {2022},
}

2021

NeurIPS

Stochastic bandits with groups of similar arms

Fabien Pesquerel, Hassan Saber, and Odalric-Ambrym Maillard

In Advances in Neural Information Processing Systems, Dec 2021

Bib HTML PDF

@inproceedings{pesquerel_bandits_group_similar_arms_2021,
  author    = {Pesquerel, Fabien and Saber, Hassan and Maillard, Odalric-Ambrym},
  booktitle = {Advances in Neural Information Processing Systems},
  editor    = {Ranzato, M. and Beygelzimer, A. and Dauphin, Y. and Liang, P. S. and Wortman Vaughan, J.},
  pages     = {19461--19472},
  publisher = {Curran Associates, Inc.},
  title     = {Stochastic bandits with groups of similar arms},
  url       = {https://proceedings.neurips.cc/paper_files/paper/2021/file/a22c0238589078fb10b606ab62015744-Paper.pdf},
  volume    = {34},
  year      = {2021}
}