% Conference paper (ICAPS 2020): joint inference of reward machines and policies.
@inproceedings{ICAPS20paper116,
  author    = {Xu, Zhe and Gavran, Ivan and Ahmad, Yousef and Majumdar, Rupak and Neider, Daniel and Topcu, Ufuk and Wu, Bo},
  title     = {Joint Inference of Reward Machines and Policies for Reinforcement Learning},
  booktitle = {Proceedings of the 30th International Conference on Automated Planning and Scheduling ({ICAPS})},
  publisher = {{AAAI} Press},
  pages     = {590--598},
  year      = {2020},
}