@mastersthesis{zimmer2014masterthesis,
  author = {Zimmer, Matthieu},
  title  = {Construction Automatique d'{\'e}tat et d'actions en Apprentissage par Renforcement},
  school = {University Pierre and Marie Curie},
  year   = {2014},
}
@unpublished{zimmer2012,
  author = {Zimmer, Matthieu and Boniface, Yann and Dutech, Alain and Rougier, Nicolas},
  title  = {Dans quelle mesure un syst{\`e}me apprenant peut prendre conscience de ses performances et alt{\'e}rer son comportement},
  note   = {Research Report},
  year   = {2012},
}
@inproceedings{zimmer2014teacher,
  author    = {Zimmer, Matthieu and Viappiani, Paolo and Weng, Paul},
  title     = {Teacher-student framework: a reinforcement learning approach},
  booktitle = {AAMAS Workshop Autonomous Robots and Multirobot Systems},
  year      = {2014},
}
@inproceedings{zimmer2016neural,
  author    = {Zimmer, Matthieu and Boniface, Yann and Dutech, Alain},
  title     = {Neural Fitted Actor-Critic},
  booktitle = {ESANN - European Symposium on Artificial Neural Networks, Computational Intelligence and Machine Learning},
  year      = {2016},
  month     = apr,
}
@inproceedings{zimmer2016vers,
  author    = {Zimmer, Matthieu and Boniface, Yann and Dutech, Alain},
  title     = {Vers des architectures acteur-critique neuronales efficaces en donn{\'e}es},
  booktitle = {Journ{\'e}es Francophones sur la Planification, la D{\'e}cision et l'Apprentissage pour la conduite de syst{\`e}mes},
  year      = {2016},
  month     = jul,
}
% The month field also carries the day: a quoted day joined to the dec macro.
@inproceedings{zimmer2016toward,
  author    = {Zimmer, Matthieu and Boniface, Yann and Dutech, Alain},
  title     = {Toward a data efficient neural actor-critic},
  booktitle = {European Workshop on Reinforcement Learning},
  year      = {2016},
  month     = "4~" # dec,
}
% The month field also carries the day: a quoted day joined to the dec macro.
@inproceedings{zimmer2016off,
  author    = {Zimmer, Matthieu and Boniface, Yann and Dutech, Alain},
  title     = {Off-Policy Neural Fitted Actor-Critic},
  booktitle = {Deep Reinforcement Learning Workshop, NeurIPS 2016},
  year      = {2016},
  month     = "10~" # dec,
}
@article{zimmer2017bootstrapping,
  author  = {Zimmer, Matthieu and Doncieux, St{\'e}phane},
  title   = {Bootstrapping {Q}-Learning for Robotics from Neuro-Evolution Results},
  journal = {IEEE Transactions on Cognitive and Developmental Systems},
  year    = {2017},
}
@phdthesis{zimmer2018phd,
  author = {Zimmer, Matthieu},
  title  = {Apprentissage par renforcement d{\'e}veloppemental},
  school = {University of Lorraine},
  year   = {2018},
  month  = jan,
}
@inproceedings{zimmer2018developmental,
  author    = {Zimmer, Matthieu and Boniface, Yann and Dutech, Alain},
  title     = {Developmental Reinforcement Learning through Sensorimotor Space Enlargement},
  booktitle = {The 8th Joint IEEE International Conference on Development and Learning and on Epigenetic Robotics},
  year      = {2018},
  month     = sep,
}
@inproceedings{zimmer2019exploiting,
  author    = {Zimmer, Matthieu and Weng, Paul},
  title     = {Exploiting the sign of the advantage function to learn deterministic policies in continuous domains},
  booktitle = {International Joint Conferences on Artificial Intelligence},
  year      = {2019},
  month     = aug,
}
@inproceedings{zimmer2019dai,
  author    = {Zimmer, Matthieu and Weng, Paul},
  title     = {An Efficient Reinforcement Learning Algorithm for Learning Deterministic Policies in Continuous Domains},
  booktitle = {Distributed Artificial Intelligence},
  year      = {2019},
  month     = sep,
}
@inproceedings{lin2019nipsw,
  author    = {Lin, Yijiong and Huang, Jiancong and Zimmer, Matthieu and Rojas, Juan and Weng, Paul},
  title     = {Towards More Sample Efficiency in Reinforcement Learning with Data Augmentation},
  booktitle = {Robot Learning: Control and Interaction in the Real World - NeurIPS workshop},
  year      = {2019},
  month     = dec,
}
@inproceedings{siddique2020icml,
  author    = {Siddique, Umer and Weng, Paul and Zimmer, Matthieu},
  title     = {Learning Fair Policies in Multi-Objective Deep Reinforcement Learning with Average and Discounted Rewards},
  booktitle = {International Conference on Machine Learning},
  year      = {2020},
}
@article{lin2020,
  author  = {Lin, Yijiong and Huang, Jiancong and Zimmer, Matthieu and Rojas, Juan and Weng, Paul},
  title   = {Invariant Transform Experience Replay},
  journal = {IEEE Robotics and Automation Letters},
  year    = {2020},
}
% Workshop entry; huang2021hyperparameter is the journal entry with the same title and authors.
@inproceedings{huang2020hyperparameter,
  author    = {Huang, Jiancong and Rojas, Juan and Zimmer, Matthieu and Wu, Hongmin and Guan, Yisheng and Weng, Paul},
  title     = {Hyperparameter Auto-tuning in Self-Supervised Robotic Learning},
  booktitle = {Deep Reinforcement Learning Workshop - NeurIPS 2020},
  year      = {2020},
}
% Journal entry; huang2020hyperparameter is the workshop entry with the same title and authors.
@article{huang2021hyperparameter,
  author  = {Huang, Jiancong and Rojas, Juan and Zimmer, Matthieu and Wu, Hongmin and Guan, Yisheng and Weng, Paul},
  title   = {Hyperparameter Auto-tuning in Self-Supervised Robotic Learning},
  journal = {IEEE Robotics and Automation Letters},
  year    = {2021},
}
% NOTE(review): the original marked the first two surnames with asterisks,
% presumably for equal contribution; confirm the wording of the note field.
@inproceedings{zimmer2021learning,
  author        = {Zimmer, Matthieu and Glanois, Claire and Siddique, Umer and Weng, Paul},
  title         = {Learning Fair Policies in Decentralized Cooperative Multi-Agent Reinforcement Learning},
  booktitle     = {International Conference on Machine Learning},
  year          = {2021},
  note          = {Matthieu Zimmer and Claire Glanois contributed equally},
  eprint        = {2012.09421},
  archiveprefix = {arXiv},
  primaryclass  = {cs.LG},
}
% Only arXiv data is recorded (no proceedings title), so the entry is typed as misc.
@misc{zimmer2021diff,
  author        = {Zimmer, Matthieu and Feng, Xuening and Glanois, Claire and Jiang, Zhaohui and Zhang, Jianyi and Weng, Paul and Li, Dong and Hao, Jianye and Liu, Wulong},
  title         = {Differentiable Logic Machines},
  year          = {2021},
  eprint        = {2102.11529},
  archiveprefix = {arXiv},
  primaryclass  = {cs.LG},
}
This file was generated by bibtex2html 1.99.