Skip to content

Commit

Permalink
add BlendRL paper
Browse files Browse the repository at this point in the history
  • Loading branch information
hkrsnd committed Dec 5, 2024
1 parent 107b77a commit 3a79d28
Show file tree
Hide file tree
Showing 2 changed files with 13 additions and 0 deletions.
Binary file added images/shindo2024blendrl.png
Loading
Sorry, something went wrong. Reload?
Sorry, we cannot display this file.
Sorry, this file is invalid so it cannot be displayed.
13 changes: 13 additions & 0 deletions references.bib
Original file line number Diff line number Diff line change
@@ -1,3 +1,16 @@
% BlendRL arXiv preprint (arXiv:2410.11689). anote points at the image added alongside this entry.
% NOTE(review): crossref holds a repository URL rather than a citation key, and pages is empty; presumably both are conventions of the tooling that consumes this file -- confirm before changing.
@misc{shindo2024blendrl_arxiv,
anote = {./images/shindo2024blendrl.png},
author = {Hikaru Shindo and Quentin Delfosse and Devendra Singh Dhami and Kristian Kersting},
title = {{BlendRL}: A Framework for Merging Symbolic and Neural Policy Learning},
keywords = {Reinforcement Learning, Neuro-Symbolic AI, Differentiable Reasoning, Interpretable and Explainable AI},
howpublished = {arXiv preprint arXiv:2410.11689},
year = {2024},
url = {https://arxiv.org/abs/2410.11689},
pages = {},
crossref = {https://github.com/ml-research/blendrl},
note = {Humans can leverage both abstract reasoning and intuitive reactions. In contrast, reinforcement learning policies are typically encoded in either opaque systems like neural networks or symbolic systems that rely on predefined symbols and rules. This disjointed approach severely limits the agents' capabilities, as they often lack either the flexible low-level reaction characteristic of neural agents or the interpretable reasoning of symbolic agents. To overcome this challenge, we introduce BlendRL, a neuro-symbolic RL framework that harmoniously integrates both paradigms within RL agents that use mixtures of both logic and neural policies. We empirically demonstrate that BlendRL agents outperform both neural and symbolic baselines in standard Atari environments, and showcase their robustness to environmental changes. Additionally, we analyze the interaction between neural and symbolic policies, illustrating how their hybrid use helps agents overcome each other's limitations.}
}

@inproceedings{hintersdorf2024balancingtransparency,
anote = {./images/hintersdorf2024balancingtransparency.png},
author = {Dominik Hintersdorf and Lukas Struppek and Kristian Kersting},
Expand Down

0 comments on commit 3a79d28

Please sign in to comment.