@inproceedings{5694c76c36ba4730901d00f6adc29cf6,
title = "Reinforcement-based Program Induction in a Neural Virtual Machine",
abstract = "We present a neural virtual machine that can be trained to perform algorithmic tasks. Rather than combining a neural controller with non-neural memory storage as has been done in the past, this architecture is purely neural and emulates tape-based memory via fast associative weights (one-step learning). Here we formally define the architecture, and then extend the system to learn programs using recurrent policy gradient reinforcement learning based on examples of program inputs labeled with corresponding output targets, which are compared against actual output to generate a sparse reward signal. We describe the policy gradient training procedure used, and report its empirical performance on a number of small-scale list processing tasks, such as finding the maximum list element, filtering out certain elements, and reversing the order of the elements. These results show that program induction via reinforcement learning is possible using sparse rewards and solely neural computations.",
keywords = "Fast Weights, Neural Networks, Policy Gradient, Program Induction",
author = "Katz, {Garrett E.} and Khushboo Gupta and Reggia, {James A.}",
note = "Publisher Copyright: {\textcopyright} 2020 IEEE.; 2020 International Joint Conference on Neural Networks, IJCNN 2020 ; Conference date: 19-07-2020 Through 24-07-2020",
year = "2020",
month = jul,
doi = "10.1109/IJCNN48605.2020.9207671",
language = "English (US)",
series = "Proceedings of the International Joint Conference on Neural Networks",
publisher = "Institute of Electrical and Electronics Engineers Inc.",
booktitle = "2020 International Joint Conference on Neural Networks, IJCNN 2020 - Proceedings",
}