% Conference paper: "Quantum Policy Gradient Algorithms" (Jerbi, Cornelissen,
% Ozols, Dunjko), TQC 2023 proceedings, LIPIcs volume 266, article 13.
% The title is single-braced so the bibliography style controls its casing;
% it contains no acronyms, proper nouns, or math that need brace protection.
% `urn` and `annote` are non-standard fields kept for reference only.
@inproceedings{jerbi_et_al:LIPIcs.TQC.2023.13,
  author    = {Jerbi, Sofiene and Cornelissen, Arjan and Ozols, Maris and Dunjko, Vedran},
  title     = {Quantum Policy Gradient Algorithms},
  booktitle = {18th Conference on the Theory of Quantum Computation, Communication and Cryptography (TQC 2023)},
  editor    = {Fawzi, Omar and Walter, Michael},
  series    = {Leibniz International Proceedings in Informatics (LIPIcs)},
  volume    = {266},
  pages     = {13:1--13:24},
  year      = {2023},
  publisher = {Schloss Dagstuhl -- Leibniz-Zentrum f{\"u}r Informatik},
  address   = {Dagstuhl, Germany},
  isbn      = {978-3-95977-283-9},
  issn      = {1868-8969},
  doi       = {10.4230/LIPIcs.TQC.2023.13},
  url       = {https://drops.dagstuhl.de/entities/document/10.4230/LIPIcs.TQC.2023.13},
  urn       = {urn:nbn:de:0030-drops-183230},
  annote    = {Keywords: quantum reinforcement learning, policy gradient methods, parametrized quantum circuits},
}