% Lawrence, Sokolov, and Riezler -- EMNLP 2017 conference paper.
% `url` uses the canonical aclanthology.org host (not the preview/staging mirror).
@inproceedings{lawrence-etal-2017-counterfactual,
  author    = {Lawrence, Carolin and Sokolov, Artem and Riezler, Stefan},
  title     = {Counterfactual Learning from Bandit Feedback under Deterministic Logging: A Case Study in Statistical Machine Translation},
  editor    = {Palmer, Martha and Hwa, Rebecca and Riedel, Sebastian},
  booktitle = {Proceedings of the 2017 Conference on Empirical Methods in Natural Language Processing},
  month     = sep,
  year      = {2017},
  address   = {Copenhagen, Denmark},
  publisher = {Association for Computational Linguistics},
  pages     = {2566--2576},
  doi       = {10.18653/v1/D17-1272},
  url       = {https://aclanthology.org/D17-1272/},
}