@inproceedings{69b6799eb3be4adba443237d1c3d6357,
title = "Provable representation learning for imitation learning via bi-level optimization",
abstract = "A common strategy in modern learning systems is to learn a representation that is useful for many tasks, a.k.a. representation learning. We study this strategy in the imitation learning setting for Markov decision processes (MDPs) where multiple experts trajectories are available. We formulate representation learning as a bi-level optimization problem where the {"}outer{"} optimization tries to learn the joint representation and the {"}inner{"} optimization encodes the imitation learning setup and tries to learn task-specific parameters. We instantiate this framework for the imitation learning settings of behavior cloning and observationalone. Theoretically, we show using our framework that representation learning can provide sample complexity benefits for imitation learning in both settings. We also provide proof-of-concept experiments to verify our theory.",
author = "Sanjeev Arora and Du, {Simon S.} and Sham Kakade and Yuping Luo and Nikunj Saunshi",
note = "Publisher Copyright: {\textcopyright} ICML 2020. All rights reserved.; 37th International Conference on Machine Learning, ICML 2020 ; Conference date: 13-07-2020 Through 18-07-2020",
year = "2020",
language = "English (US)",
series = "37th International Conference on Machine Learning, ICML 2020",
publisher = "International Machine Learning Society (IMLS)",
pages = "344--353",
editor = "Hal Daume and Aarti Singh",
booktitle = "37th International Conference on Machine Learning, ICML 2020",
}