% arXiv preprint 2006.14091. The identifier is stored in eprint/archiveprefix
% (plus a plain url) rather than in a journal field, so each style can format
% and link it on its own terms.
@misc{biyik2020learning,
  author        = {B{\i}y{\i}k, Erdem and Losey, Dylan P. and Palan, Malayandi and Landolfi, Nicholas C. and Shevchuk, Gleb and Sadigh, Dorsa},
  title         = {Learning reward functions from diverse sources of human feedback: Optimally integrating demonstrations and preferences},
  year          = {2020},
  eprint        = {2006.14091},
  archiveprefix = {arXiv},
  url           = {https://arxiv.org/abs/2006.14091},
}