% Master's thesis (2014). Accents are LaTeX-escaped, matching the other
% French titles in this file, so classic 8-bit BibTeX handles them.
@mastersthesis{zimmer2014masterthesis,
  author = {Zimmer, Matthieu},
  title  = {Construction Automatique d'{\'e}tat et d'actions en Apprentissage par Renforcement},
  school = {University Pierre and Marie Curie},
  year   = {2014},
}
% Unpublished research report (2012). Accents are LaTeX-escaped, matching
% the other French titles in this file.
@unpublished{zimmer2012,
  author = {Zimmer, Matthieu and Boniface, Yann and Dutech, Alain and Rougier, Nicolas},
  title  = {Dans quelle mesure un syst{\`e}me apprenant peut prendre conscience de ses performances et alt{\'e}rer son comportement},
  note   = {Research Report},
  year   = {2012},
}
% Workshop paper (2014).
@inproceedings{zimmer2014teacher,
  author    = {Zimmer, Matthieu and Viappiani, Paolo and Weng, Paul},
  title     = {Teacher-student framework: a reinforcement learning approach},
  booktitle = {AAMAS Workshop Autonomous Robots and Multirobot Systems},
  year      = {2014},
}
% Conference paper (April 2016). The month uses the predefined macro so the
% bibliography style controls its rendering.
@inproceedings{zimmer2016neural,
  author    = {Zimmer, Matthieu and Boniface, Yann and Dutech, Alain},
  title     = {Neural Fitted Actor-Critic},
  booktitle = {ESANN - European Symposium on Artificial Neural Networks, Computational Intelligence and Machine Learning},
  year      = {2016},
  month     = apr,
}
% French-language conference paper (July 2016). The month uses the
% predefined macro so the bibliography style controls its rendering.
@inproceedings{zimmer2016vers,
  author    = {Zimmer, Matthieu and Boniface, Yann and Dutech, Alain},
  title     = {Vers des architectures acteur-critique neuronales efficaces en donn{\'e}es},
  booktitle = {Journ{\'e}es Francophones sur la Planification, la D{\'e}cision et l'Apprentissage pour la conduite de syst{\`e}mes},
  year      = {2016},
  month     = jul,
}
% Workshop paper (4 December 2016). The day is concatenated onto the month
% macro so the month name is still rendered by the bibliography style.
@inproceedings{zimmer2016toward,
  author    = {Zimmer, Matthieu and Boniface, Yann and Dutech, Alain},
  title     = {Toward a data efficient neural actor-critic},
  booktitle = {European Workshop on Reinforcement Learning},
  year      = {2016},
  month     = "4~" # dec,
}
% Workshop paper (10 December 2016). The day is concatenated onto the month
% macro so the month name is still rendered by the bibliography style.
@inproceedings{zimmer2016off,
  author    = {Zimmer, Matthieu and Boniface, Yann and Dutech, Alain},
  title     = {Off-Policy Neural Fitted Actor-Critic},
  booktitle = {Deep Reinforcement Learning Workshop, NeurIPS 2016},
  year      = {2016},
  month     = "10~" # dec,
}
% Journal article (2017). Q-Learning is braced so that sentence-casing
% styles keep its capitalisation.
@article{zimmer2017bootstrapping,
  author  = {Zimmer, Matthieu and Doncieux, Stephane},
  title   = {Bootstrapping {Q-Learning} for Robotics from Neuro-Evolution Results},
  journal = {IEEE Transactions on Cognitive and Developmental Systems},
  year    = {2017},
}
% PhD thesis (January 2018). The accent is LaTeX-escaped, matching the other
% French titles in this file; the month uses the predefined macro.
@phdthesis{zimmer2018phd,
  author = {Zimmer, Matthieu},
  title  = {Apprentissage par renforcement d{\'e}veloppemental},
  school = {University of Lorraine},
  year   = {2018},
  month  = jan,
}
% Conference paper (September 2018). The month uses the predefined macro so
% the bibliography style controls its rendering.
@inproceedings{zimmer2018developmental,
  author    = {Zimmer, Matthieu and Boniface, Yann and Dutech, Alain},
  title     = {Developmental Reinforcement Learning through Sensorimotor Space Enlargement},
  booktitle = {The 8th Joint IEEE International Conference on Development and Learning and on Epigenetic Robotics},
  year      = {2018},
  month     = sep,
}
% Conference paper (August 2019). The month uses the predefined macro so
% the bibliography style controls its rendering.
@inproceedings{zimmer2019exploiting,
  author    = {Zimmer, Matthieu and Weng, Paul},
  title     = {Exploiting the sign of the advantage function to learn deterministic policies in continuous domains},
  booktitle = {International Joint Conferences on Artificial Intelligence},
  year      = {2019},
  month     = aug,
}
% Conference paper (September 2019). The month uses the predefined macro so
% the bibliography style controls its rendering.
@inproceedings{zimmer2019dai,
  author    = {Zimmer, Matthieu and Weng, Paul},
  title     = {An Efficient Reinforcement Learning Algorithm for Learning Deterministic Policies in Continuous Domains},
  booktitle = {Distributed Artificial Intelligence},
  year      = {2019},
  month     = sep,
}
% Workshop paper (December 2019). The month uses the predefined macro so
% the bibliography style controls its rendering.
@inproceedings{lin2019nipsw,
  author    = {Lin, Yijiong and Huang, Jiancong and Zimmer, Matthieu and Rojas, Juan and Weng, Paul},
  title     = {Towards More Sample Efficiency in Reinforcement Learning with Data Augmentation},
  booktitle = {Robot Learning: Control and Interaction in the Real World - NeurIPS workshop},
  year      = {2019},
  month     = dec,
}
% Conference paper (2020).
@inproceedings{siddique2020icml,
  author    = {Siddique, Umer and Weng, Paul and Zimmer, Matthieu},
  title     = {Learning Fair Policies in Multi-Objective Deep Reinforcement Learning with Average and Discounted Rewards},
  booktitle = {International Conference on Machine Learning},
  year      = {2020},
}
% Journal article (2020).
@article{lin2020,
  author  = {Lin, Yijiong and Huang, Jiancong and Zimmer, Matthieu and Rojas, Juan and Weng, Paul},
  title   = {Invariant Transform Experience Replay},
  journal = {IEEE Robotics and Automation Letters},
  year    = {2020},
}
% Workshop version (2020) of the hyperparameter auto-tuning paper. Authors
% are written in "Last, First" form like the other entries in this file.
@inproceedings{huang2020hyperparameter,
  author    = {Huang, Jiancong and Rojas, Juan and Zimmer, Matthieu and Wu, Hongmin and Guan, Yisheng and Weng, Paul},
  title     = {Hyperparameter Auto-tuning in Self-Supervised Robotic Learning},
  booktitle = {Deep Reinforcement Learning Workshop - NeurIPS 2020},
  year      = {2020},
}
% Journal version (2021) of the hyperparameter auto-tuning paper. Authors
% are written in "Last, First" form like the other entries in this file.
@article{huang2021hyperparameter,
  author  = {Huang, Jiancong and Rojas, Juan and Zimmer, Matthieu and Wu, Hongmin and Guan, Yisheng and Weng, Paul},
  title   = {Hyperparameter Auto-tuning in Self-Supervised Robotic Learning},
  journal = {IEEE Robotics and Automation Letters},
  year    = {2021},
}
% Conference paper (2021) with an arXiv identifier.
% NOTE(review): the asterisks previously attached to the first two surnames
% were moved out of the author field, where they became part of the parsed
% family names. They presumably marked equal contribution; confirm the
% wording of the note field against the paper.
@inproceedings{zimmer2021learning,
  author        = {Zimmer, Matthieu and Glanois, Claire and Siddique, Umer and Weng, Paul},
  title         = {Learning Fair Policies in Decentralized Cooperative Multi-Agent Reinforcement Learning},
  booktitle     = {International Conference on Machine Learning},
  year          = {2021},
  eprint        = {2012.09421},
  archiveprefix = {arXiv},
  primaryclass  = {cs.LG},
  note          = {Matthieu Zimmer and Claire Glanois contributed equally},
}
% arXiv preprint (2021). It has no proceedings title, so the misc entry type
% is used instead of inproceedings, which requires a booktitle.
% NOTE(review): the last three authors were reordered to family-name-first
% (Li, Hao, Liu); confirm against the arXiv listing.
@misc{zimmer2021diff,
  author        = {Zimmer, Matthieu and Feng, Xuening and Glanois, Claire and Jiang, Zhaohui and Zhang, Jianyi and Weng, Paul and Li, Dong and Hao, Jianye and Liu, Wulong},
  title         = {Differentiable Logic Machines},
  year          = {2021},
  eprint        = {2102.11529},
  archiveprefix = {arXiv},
  primaryclass  = {cs.LG},
}
This file was generated by bibtex2html 1.99.