iBet uBet web content aggregator. Adding the entire web to your favor.



Link to original content: https://dblp.dagstuhl.de/pid/54/6742-1.bib
% Bibliography exported from DBLP (see the biburl / bibsource fields of each
% record). 28 records, listed from the most recent year (2024) down to 2016.
%
% Layout: one field per line, values brace-delimited, "=" aligned.
% Field values are as exported by DBLP, with these deliberate exceptions:
%   * proper nouns / case-sensitive tokens inside titles are brace-protected
%     (Grover, Chylla-Haase, Q-value) so sentence-casing styles keep them;
%   * straight double quotes in a title are replaced by TeX quotes;
%   * the two-word surname "La Cour" is braced so it is parsed as one surname.
% Several works appear twice on purpose: once as the published version and
% once as the CoRR (arXiv) preprint, under distinct citation keys.

% ---------------------------------------------------------------- 2024 ----

@article{DBLP:journals/corr/abs-2404-10017,
  author     = {Simon Eisenmann and Daniel Hein and Steffen Udluft and Thomas A. Runkler},
  title      = {Model-based Offline Quantum Reinforcement Learning},
  journal    = {CoRR},
  volume     = {abs/2404.10017},
  year       = {2024},
  url        = {https://doi.org/10.48550/arXiv.2404.10017},
  doi        = {10.48550/ARXIV.2404.10017},
  eprinttype = {arXiv},
  eprint     = {2404.10017},
  timestamp  = {Fri, 31 May 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2404-10017.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}

% "Q-value" is braced: the capital Q is significant and must survive recasing.
@article{DBLP:journals/corr/abs-2407-11751,
  author     = {Philipp Wissmann and Daniel Hein and Steffen Udluft and Volker Tresp},
  title      = {Why long model-based rollouts are no reason for bad {Q-value} estimates},
  journal    = {CoRR},
  volume     = {abs/2407.11751},
  year       = {2024},
  url        = {https://doi.org/10.48550/arXiv.2407.11751},
  doi        = {10.48550/ARXIV.2407.11751},
  eprinttype = {arXiv},
  eprint     = {2407.11751},
  timestamp  = {Fri, 23 Aug 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2407-11751.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}

% ---------------------------------------------------------------- 2023 ----

% "Grover" is a proper noun and is braced to keep its capital.
@article{DBLP:journals/tmlr/WiedemannHUM23,
  author     = {Simon Wiedemann and Daniel Hein and Steffen Udluft and Christian B. Mendl},
  title      = {Quantum Policy Iteration via Amplitude Estimation and {Grover} Search - Towards Quantum Advantage for Reinforcement Learning},
  journal    = {Trans. Mach. Learn. Res.},
  volume     = {2023},
  year       = {2023},
  url        = {https://openreview.net/forum?id=HG11PAmwQ6},
  timestamp  = {Thu, 18 May 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/tmlr/WiedemannHUM23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}

% Editor surname "La Cour" is braced; unbraced, BibTeX would take only "Cour"
% as the surname and treat "La" as a given name.
@inproceedings{DBLP:conf/qce/TrespUHHLMSM23,
  author     = {Volker Tresp and Steffen Udluft and Daniel Hein and Werner Hauptmann and Martin Leib and Christopher Mutschler and Daniel D. Scherer and Wolfgang Mauerer},
  editor     = {Brian {La Cour} and Lia Yeh and Marek Osinski},
  title      = {Workshop Summary: Quantum Machine Learning},
  booktitle  = {{IEEE} International Conference on Quantum Computing and Engineering, {QCE} 2023, Bellevue, WA, USA, September 17-22, 2023},
  pages      = {1--3},
  publisher  = {{IEEE}},
  year       = {2023},
  url        = {https://doi.org/10.1109/QCE57702.2023.10174},
  doi        = {10.1109/QCE57702.2023.10174},
  timestamp  = {Fri, 15 Dec 2023 20:24:40 +0100},
  biburl     = {https://dblp.org/rec/conf/qce/TrespUHHLMSM23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/ssci/WeberSHUS23,
  author     = {Marc Weber and Phillip Swazinna and Daniel Hein and Steffen Udluft and Volkmar Sterzing},
  title      = {Learning Control Policies for Variable Objectives from Offline Data},
  booktitle  = {{IEEE} Symposium Series on Computational Intelligence, {SSCI} 2023, Mexico City, Mexico, December 5-8, 2023},
  pages      = {1674--1681},
  publisher  = {{IEEE}},
  year       = {2023},
  url        = {https://doi.org/10.1109/SSCI52147.2023.10371978},
  doi        = {10.1109/SSCI52147.2023.10371978},
  timestamp  = {Mon, 15 Jan 2024 21:26:31 +0100},
  biburl     = {https://dblp.org/rec/conf/ssci/WeberSHUS23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}

@article{DBLP:journals/corr/abs-2308-06127,
  author     = {Marc Weber and Phillip Swazinna and Daniel Hein and Steffen Udluft and Volkmar Sterzing},
  title      = {Learning Control Policies for Variable Objectives from Offline Data},
  journal    = {CoRR},
  volume     = {abs/2308.06127},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2308.06127},
  doi        = {10.48550/ARXIV.2308.06127},
  eprinttype = {arXiv},
  eprint     = {2308.06127},
  timestamp  = {Wed, 23 Aug 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2308-06127.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}

% ---------------------------------------------------------------- 2022 ----

@inproceedings{DBLP:conf/atal/MeessGHSE22,
  author     = {Henri Meess and Jeremias Gerner and Daniel Hein and Stefanie Schmidtner and Gordon Elger},
  editor     = {Piotr Faliszewski and Viviana Mascardi and Catherine Pelachaud and Matthew E. Taylor},
  title      = {Reinforcement Learning for Traffic Signal Control Optimization: {A} Concept for Real-World Implementation},
  booktitle  = {21st International Conference on Autonomous Agents and Multiagent Systems, {AAMAS} 2022, Auckland, New Zealand, May 9-13, 2022},
  pages      = {1699--1701},
  publisher  = {International Foundation for Autonomous Agents and Multiagent Systems {(IFAAMAS)}},
  year       = {2022},
  url        = {https://www.ifaamas.org/Proceedings/aamas2022/pdfs/p1699.pdf},
  doi        = {10.5555/3535850.3536081},
  timestamp  = {Mon, 18 Jul 2022 17:13:00 +0200},
  biburl     = {https://dblp.org/rec/conf/atal/MeessGHSE22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}

@article{DBLP:journals/corr/abs-2201-05433,
  author     = {Phillip Swazinna and Steffen Udluft and Daniel Hein and Thomas A. Runkler},
  title      = {Comparing Model-free and Model-based Algorithms for Offline Reinforcement Learning},
  journal    = {CoRR},
  volume     = {abs/2201.05433},
  year       = {2022},
  url        = {https://arxiv.org/abs/2201.05433},
  eprinttype = {arXiv},
  eprint     = {2201.05433},
  timestamp  = {Thu, 20 Jan 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2201-05433.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}

% "Grover" is a proper noun and is braced to keep its capital.
@article{DBLP:journals/corr/abs-2206-04741,
  author     = {Simon Wiedemann and Daniel Hein and Steffen Udluft and Christian B. Mendl},
  title      = {Quantum Policy Iteration via Amplitude Estimation and {Grover} Search - Towards Quantum Advantage for Reinforcement Learning},
  journal    = {CoRR},
  volume     = {abs/2206.04741},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2206.04741},
  doi        = {10.48550/ARXIV.2206.04741},
  eprinttype = {arXiv},
  eprint     = {2206.04741},
  timestamp  = {Thu, 18 May 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2206-04741.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}

% ---------------------------------------------------------------- 2021 ----

@inproceedings{DBLP:conf/esann/SwazinnaU0R21,
  author     = {Phillip Swazinna and Steffen Udluft and Daniel Hein and Thomas A. Runkler},
  title      = {Behavior Constraining in Weight Space for Offline Reinforcement Learning},
  booktitle  = {29th European Symposium on Artificial Neural Networks, Computational Intelligence and Machine Learning, {ESANN} 2021, Online event (Bruges, Belgium), October 6-8, 2021},
  year       = {2021},
  url        = {https://doi.org/10.14428/esann/2021.ES2021-83},
  doi        = {10.14428/ESANN/2021.ES2021-83},
  timestamp  = {Tue, 31 May 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/esann/SwazinnaU0R21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}

% "Chylla-Haase" is a proper noun and is braced to keep its capitals.
@inproceedings{DBLP:conf/gecco/0001L21,
  author     = {Daniel Hein and Daniel Labisch},
  editor     = {Krzysztof Krawiec},
  title      = {Trustworthy {AI} for process automation on a {Chylla-Haase} polymerization reactor},
  booktitle  = {{GECCO} '21: Genetic and Evolutionary Computation Conference, Companion Volume, Lille, France, July 10-14, 2021},
  pages      = {1570--1578},
  publisher  = {{ACM}},
  year       = {2021},
  url        = {https://doi.org/10.1145/3449726.3463131},
  doi        = {10.1145/3449726.3463131},
  timestamp  = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/gecco/0001L21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}

@article{DBLP:journals/corr/abs-2107-05479,
  author     = {Phillip Swazinna and Steffen Udluft and Daniel Hein and Thomas A. Runkler},
  title      = {Behavior Constraining in Weight Space for Offline Reinforcement Learning},
  journal    = {CoRR},
  volume     = {abs/2107.05479},
  year       = {2021},
  url        = {https://arxiv.org/abs/2107.05479},
  eprinttype = {arXiv},
  eprint     = {2107.05479},
  timestamp  = {Tue, 20 Jul 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2107-05479.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}

% "Chylla-Haase" is a proper noun and is braced to keep its capitals.
@article{DBLP:journals/corr/abs-2108-13381,
  author     = {Daniel Hein and Daniel Labisch},
  title      = {Trustworthy {AI} for Process Automation on a {Chylla-Haase} Polymerization Reactor},
  journal    = {CoRR},
  volume     = {abs/2108.13381},
  year       = {2021},
  url        = {https://arxiv.org/abs/2108.13381},
  eprinttype = {arXiv},
  eprint     = {2108.13381},
  timestamp  = {Fri, 03 Sep 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2108-13381.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}

% ---------------------------------------------------------------- 2020 ----

@article{DBLP:journals/corr/abs-2007-09964,
  author     = {Daniel Hein and Steffen Limmer and Thomas A. Runkler},
  title      = {Interpretable Control by Reinforcement Learning},
  journal    = {CoRR},
  volume     = {abs/2007.09964},
  year       = {2020},
  url        = {https://arxiv.org/abs/2007.09964},
  eprinttype = {arXiv},
  eprint     = {2007.09964},
  timestamp  = {Tue, 28 Jul 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2007-09964.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}

% ---------------------------------------------------------------- 2019 ----

@phdthesis{DBLP:phd/dnb/Hein19,
  author     = {Daniel Hein},
  title      = {Interpretable Reinforcement Learning Policies by Evolutionary Computation},
  school     = {Technical University of Munich, Germany},
  year       = {2019},
  url        = {https://nbn-resolving.org/urn:nbn:de:bvb:91-diss-20191009-1467616-1-1},
  urn        = {urn:nbn:de:bvb:91-diss-20191009-1467616-1-1},
  timestamp  = {Sat, 17 Jul 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/phd/dnb/Hein19.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/gecco/0001UR19,
  author     = {Daniel Hein and Steffen Udluft and Thomas A. Runkler},
  editor     = {Manuel L{\'{o}}pez{-}Ib{\'{a}}{\~{n}}ez and Anne Auger and Thomas St{\"{u}}tzle},
  title      = {Generating interpretable reinforcement learning policies using genetic programming},
  booktitle  = {Proceedings of the Genetic and Evolutionary Computation Conference Companion, {GECCO} 2019, Prague, Czech Republic, July 13-17, 2019},
  pages      = {23--24},
  publisher  = {{ACM}},
  year       = {2019},
  url        = {https://doi.org/10.1145/3319619.3326755},
  doi        = {10.1145/3319619.3326755},
  timestamp  = {Thu, 23 Sep 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/gecco/0001UR19.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}

% ---------------------------------------------------------------- 2018 ----

@article{DBLP:journals/eaai/HeinUR18,
  author     = {Daniel Hein and Steffen Udluft and Thomas A. Runkler},
  title      = {Interpretable policies for reinforcement learning by genetic programming},
  journal    = {Eng. Appl. Artif. Intell.},
  volume     = {76},
  pages      = {158--169},
  year       = {2018},
  url        = {https://doi.org/10.1016/j.engappai.2018.09.007},
  doi        = {10.1016/J.ENGAPPAI.2018.09.007},
  timestamp  = {Tue, 16 Aug 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/eaai/HeinUR18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/gecco/HeinUR18,
  author     = {Daniel Hein and Steffen Udluft and Thomas A. Runkler},
  editor     = {Hern{\'{a}}n E. Aguirre and Keiki Takadama},
  title      = {Generating interpretable fuzzy controllers using particle swarm optimization and genetic programming},
  booktitle  = {Proceedings of the Genetic and Evolutionary Computation Conference Companion, {GECCO} 2018, Kyoto, Japan, July 15-19, 2018},
  pages      = {1268--1275},
  publisher  = {{ACM}},
  year       = {2018},
  url        = {https://doi.org/10.1145/3205651.3208277},
  doi        = {10.1145/3205651.3208277},
  timestamp  = {Fri, 02 Aug 2024 15:50:42 +0200},
  biburl     = {https://dblp.org/rec/conf/gecco/HeinUR18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}

@article{DBLP:journals/corr/abs-1804-10960,
  author     = {Daniel Hein and Steffen Udluft and Thomas A. Runkler},
  title      = {Generating Interpretable Fuzzy Controllers using Particle Swarm Optimization and Genetic Programming},
  journal    = {CoRR},
  volume     = {abs/1804.10960},
  year       = {2018},
  url        = {http://arxiv.org/abs/1804.10960},
  eprinttype = {arXiv},
  eprint     = {1804.10960},
  timestamp  = {Tue, 04 Dec 2018 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1804-10960.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}

% ---------------------------------------------------------------- 2017 ----

@article{DBLP:journals/eaai/HeinHRU17,
  author     = {Daniel Hein and Alexander Hentschel and Thomas A. Runkler and Steffen Udluft},
  title      = {Particle swarm optimization for generating interpretable fuzzy reinforcement learning policies},
  journal    = {Eng. Appl. Artif. Intell.},
  volume     = {65},
  pages      = {87--98},
  year       = {2017},
  url        = {https://doi.org/10.1016/j.engappai.2017.07.005},
  doi        = {10.1016/J.ENGAPPAI.2017.07.005},
  timestamp  = {Tue, 16 Aug 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/eaai/HeinHRU17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/ijcnn/HeinUTHRS17,
  author     = {Daniel Hein and Steffen Udluft and Michel Tokic and Alexander Hentschel and Thomas A. Runkler and Volkmar Sterzing},
  title      = {Batch reinforcement learning on the industrial benchmark: First experiences},
  booktitle  = {2017 International Joint Conference on Neural Networks, {IJCNN} 2017, Anchorage, AK, USA, May 14-19, 2017},
  pages      = {4214--4221},
  publisher  = {{IEEE}},
  year       = {2017},
  url        = {https://doi.org/10.1109/IJCNN.2017.7966389},
  doi        = {10.1109/IJCNN.2017.7966389},
  timestamp  = {Thu, 23 Sep 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/ijcnn/HeinUTHRS17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/ssci/HeinDTUHRS17,
  author     = {Daniel Hein and Stefan Depeweg and Michel Tokic and Steffen Udluft and Alexander Hentschel and Thomas A. Runkler and Volkmar Sterzing},
  title      = {A benchmark environment motivated by industrial control problems},
  booktitle  = {2017 {IEEE} Symposium Series on Computational Intelligence, {SSCI} 2017, Honolulu, HI, USA, November 27 - Dec. 1, 2017},
  pages      = {1--8},
  publisher  = {{IEEE}},
  year       = {2017},
  url        = {https://doi.org/10.1109/SSCI.2017.8280935},
  doi        = {10.1109/SSCI.2017.8280935},
  timestamp  = {Thu, 23 Sep 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/ssci/HeinDTUHRS17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}

@article{DBLP:journals/corr/HeinUTHRS17,
  author     = {Daniel Hein and Steffen Udluft and Michel Tokic and Alexander Hentschel and Thomas A. Runkler and Volkmar Sterzing},
  title      = {Batch Reinforcement Learning on the Industrial Benchmark: First Experiences},
  journal    = {CoRR},
  volume     = {abs/1705.07262},
  year       = {2017},
  url        = {http://arxiv.org/abs/1705.07262},
  eprinttype = {arXiv},
  eprint     = {1705.07262},
  timestamp  = {Tue, 04 Dec 2018 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/HeinUTHRS17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}

@article{DBLP:journals/corr/abs-1709-09480,
  author     = {Daniel Hein and Stefan Depeweg and Michel Tokic and Steffen Udluft and Alexander Hentschel and Thomas A. Runkler and Volkmar Sterzing},
  title      = {A Benchmark Environment Motivated by Industrial Control Problems},
  journal    = {CoRR},
  volume     = {abs/1709.09480},
  year       = {2017},
  url        = {http://arxiv.org/abs/1709.09480},
  eprinttype = {arXiv},
  eprint     = {1709.09480},
  timestamp  = {Tue, 04 Dec 2018 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1709-09480.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}

@article{DBLP:journals/corr/abs-1712-04170,
  author     = {Daniel Hein and Steffen Udluft and Thomas A. Runkler},
  title      = {Interpretable Policies for Reinforcement Learning by Genetic Programming},
  journal    = {CoRR},
  volume     = {abs/1712.04170},
  year       = {2017},
  url        = {http://arxiv.org/abs/1712.04170},
  eprinttype = {arXiv},
  eprint     = {1712.04170},
  timestamp  = {Tue, 04 Dec 2018 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1712-04170.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}

% ---------------------------------------------------------------- 2016 ----

@article{DBLP:journals/ijsir/HeinHRU16,
  author     = {Daniel Hein and Alexander Hentschel and Thomas A. Runkler and Steffen Udluft},
  title      = {Reinforcement Learning with Particle Swarm Optimization Policy {(PSO-P)} in Continuous State and Action Spaces},
  journal    = {Int. J. Swarm Intell. Res.},
  volume     = {7},
  number     = {3},
  pages      = {23--42},
  year       = {2016},
  url        = {https://doi.org/10.4018/IJSIR.2016070102},
  doi        = {10.4018/IJSIR.2016070102},
  timestamp  = {Tue, 29 Sep 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/ijsir/HeinHRU16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}

% The quoted name uses TeX opening/closing quotes; straight double quotes
% would be typeset as two closing quotes. The group is braced to keep its case.
@article{DBLP:journals/corr/HeinHSTU16,
  author     = {Daniel Hein and Alexander Hentschel and Volkmar Sterzing and Michel Tokic and Steffen Udluft},
  title      = {Introduction to the {``Industrial Benchmark''}},
  journal    = {CoRR},
  volume     = {abs/1610.03793},
  year       = {2016},
  url        = {http://arxiv.org/abs/1610.03793},
  eprinttype = {arXiv},
  eprint     = {1610.03793},
  timestamp  = {Tue, 04 Dec 2018 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/HeinHSTU16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}

@article{DBLP:journals/corr/HeinHRU16,
  author     = {Daniel Hein and Alexander Hentschel and Thomas A. Runkler and Steffen Udluft},
  title      = {Particle Swarm Optimization for Generating Fuzzy Reinforcement Learning Policies},
  journal    = {CoRR},
  volume     = {abs/1610.05984},
  year       = {2016},
  url        = {http://arxiv.org/abs/1610.05984},
  eprinttype = {arXiv},
  eprint     = {1610.05984},
  timestamp  = {Tue, 04 Dec 2018 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/HeinHRU16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}