Learning modular structures which reflect the dynamics of the environment can
lead to better generalization and robustness to changes which only affect a few
of the underlying causes. We propose Recurrent Independent Mechanisms (RIMs), a
new recurrent architecture in which multiple groups of recurrent cells operate
with nearly independent transition dynamics, communicate only sparingly through
the bottleneck of attention, and are only updated at time steps where they are
most relevant. We show that this leads to specialization amongst the RIMs,
which in turn allows for dramatically improved generalization on tasks where
some factors of variation differ systematically between training and
evaluation.
%0 Generic
%1 goyal2019recurrent
%A Goyal, Anirudh
%A Lamb, Alex
%A Hoffmann, Jordan
%A Sodhani, Shagun
%A Levine, Sergey
%A Bengio, Yoshua
%A Schölkopf, Bernhard
%D 2019
%K rnn
%T Recurrent Independent Mechanisms
%U http://arxiv.org/abs/1909.10893
%X Learning modular structures which reflect the dynamics of the environment can
lead to better generalization and robustness to changes which only affect a few
of the underlying causes. We propose Recurrent Independent Mechanisms (RIMs), a
new recurrent architecture in which multiple groups of recurrent cells operate
with nearly independent transition dynamics, communicate only sparingly through
the bottleneck of attention, and are only updated at time steps where they are
most relevant. We show that this leads to specialization amongst the RIMs,
which in turn allows for dramatically improved generalization on tasks where
some factors of variation differ systematically between training and
evaluation.
@misc{goyal2019recurrent,
abstract = {Learning modular structures which reflect the dynamics of the environment can
lead to better generalization and robustness to changes which only affect a few
of the underlying causes. We propose Recurrent Independent Mechanisms (RIMs), a
new recurrent architecture in which multiple groups of recurrent cells operate
with nearly independent transition dynamics, communicate only sparingly through
the bottleneck of attention, and are only updated at time steps where they are
most relevant. We show that this leads to specialization amongst the RIMs,
which in turn allows for dramatically improved generalization on tasks where
some factors of variation differ systematically between training and
evaluation.},
added-at = {2019-09-27T20:33:18.000+0200},
author = {Goyal, Anirudh and Lamb, Alex and Hoffmann, Jordan and Sodhani, Shagun and Levine, Sergey and Bengio, Yoshua and Schölkopf, Bernhard},
biburl = {https://www.bibsonomy.org/bibtex/239ad243bc3a59a843fbad4a5a25d7ac9/topel},
interhash = {92ffe8c22b69ca64b56c2f76d8088825},
intrahash = {39ad243bc3a59a843fbad4a5a25d7ac9},
keywords = {rnn},
note = {cite arxiv:1909.10893},
timestamp = {2019-09-27T20:33:18.000+0200},
title = {Recurrent Independent Mechanisms},
url = {http://arxiv.org/abs/1909.10893},
year = 2019
}