forked from attentionagent/attentionagent.github.io
-
Notifications
You must be signed in to change notification settings - Fork 0
/
draft_bib.html
1075 lines (1073 loc) · 42.3 KB
/
draft_bib.html
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
665
666
667
668
669
670
671
672
673
674
675
676
677
678
679
680
681
682
683
684
685
686
687
688
689
690
691
692
693
694
695
696
697
698
699
700
701
702
703
704
705
706
707
708
709
710
711
712
713
714
715
716
717
718
719
720
721
722
723
724
725
726
727
728
729
730
731
732
733
734
735
736
737
738
739
740
741
742
743
744
745
746
747
748
749
750
751
752
753
754
755
756
757
758
759
760
761
762
763
764
765
766
767
768
769
770
771
772
773
774
775
776
777
778
779
780
781
782
783
784
785
786
787
788
789
790
791
792
793
794
795
796
797
798
799
800
801
802
803
804
805
806
807
808
809
810
811
812
813
814
815
816
817
818
819
820
821
822
823
824
825
826
827
828
829
830
831
832
833
834
835
836
837
838
839
840
841
842
843
844
845
846
847
848
849
850
851
852
853
854
855
856
857
858
859
860
861
862
863
864
865
866
867
868
869
870
871
872
873
874
875
876
877
878
879
880
881
882
883
884
885
886
887
888
889
890
891
892
893
894
895
896
897
898
899
900
901
902
903
904
905
906
907
908
909
910
911
912
913
914
915
916
917
918
919
920
921
922
923
924
925
926
927
928
929
930
931
932
933
934
935
936
937
938
939
940
941
942
943
944
945
946
947
948
949
950
951
952
953
954
955
956
957
958
959
960
961
962
963
964
965
966
967
968
969
970
971
972
973
974
975
976
977
978
979
980
981
982
983
984
985
986
987
988
989
990
991
992
993
994
995
996
997
998
999
1000
</dt-appendix>
</body>
<script type="text/bibliography">
@article{core_knowledge,
  author  = {Spelke, Elizabeth S. and Kinzler, Katherine D.},
  title   = {Core knowledge},
  journal = {Developmental Science},
  volume  = {10},
  number  = {1},
  pages   = {89--96},
  year    = {2007},
  url     = {http://www.wjh.harvard.edu/~lds/pdfs/SpelkeKinzler07.pdf}
}
@article{brainfacts,
  author       = {Brain Facts},
  title        = {Vision: Processing Information},
  journal      = {Brain Facts},
  year         = {2012},
  month        = apr,
  url          = {https://www.brainfacts.org/thinking-sensing-and-behaving/vision/2012/vision-processing-information},
  lastaccessed = {January 10, 2020}
}
@article{Sorokin2015DeepAR,
  author  = {Ivan Sorokin and Alexey Seleznev and Mikhail Pavlov and Aleksandr Fedorov and Anastasiia Ignateva},
  title   = {Deep Attention Recurrent Q-Network},
  journal = {ArXiv},
  volume  = {abs/1512.01693},
  year    = {2015},
  url     = {https://arxiv.org/abs/1512.01693}
}
@inproceedings{DBLP:conf/nips/MottZCWR19,
  author    = {Alexander Mott and Daniel Zoran and Mike Chrzanowski and Daan Wierstra and Danilo Jimenez Rezende},
  title     = {Towards Interpretable Reinforcement Learning Using Attention Augmented Agents},
  booktitle = {Advances in Neural Information Processing Systems 32: Annual Conference on Neural Information Processing Systems 2019, NeurIPS 2019, 8-14 December 2019, Vancouver, BC, Canada},
  pages     = {12329--12338},
  year      = {2019},
  url       = {https://bit.ly/2Ul97za},
  timestamp = {Mon, 06 Jan 2020 18:52:01 +0100},
  biburl    = {https://dblp.org/rec/bib/conf/nips/MottZCWR19},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{hausknecht2012hyperneat,
  author    = {Hausknecht, Matthew and Khandelwal, Piyush and Miikkulainen, Risto and Stone, Peter},
  title     = {HyperNEAT-GGP: A HyperNEAT-based Atari general game player},
  booktitle = {Proceedings of the 14th annual conference on Genetic and evolutionary computation},
  pages     = {217--224},
  year      = {2012},
  url       = {http://nn.cs.utexas.edu/downloads/papers/hausknecht.gecco12.pdf}
}
@inproceedings{koutnik2013evolving,
  author    = {Koutnik, Jan and Cuccu, Giuseppe and Schmidhuber, Juergen and Gomez, Faustino},
  title     = {Evolving large-scale neural networks for vision-based reinforcement learning},
  booktitle = {Proceedings of the 15th annual conference on Genetic and evolutionary computation},
  pages     = {1061--1068},
  year      = {2013},
  url       = {http://people.idsia.ch/~juergen/compressednetworksearch.html}
}
@inproceedings{wann2019,
  author    = {Gaier, Adam and Ha, David},
  title     = {Weight agnostic neural networks},
  booktitle = {Advances in Neural Information Processing Systems},
  pages     = {5365--5379},
  year      = {2019},
  url       = {https://weightagnostic.github.io}
}
@article{zador2019critique,
  author    = {Zador, Anthony M},
  title     = {A critique of pure learning and what artificial neural networks can learn from animal brains},
  journal   = {Nature communications},
  volume    = {10},
  number    = {1},
  pages     = {1--7},
  year      = {2019},
  publisher = {Nature Publishing Group},
  url       = {https://www.nature.com/articles/s41467-019-11786-6}
}
@article{stanley2009hyperneat,
  author    = {Stanley, Kenneth O and D'Ambrosio, David B and Gauci, Jason},
  title     = {A hypercube-based encoding for evolving large-scale neural networks},
  journal   = {Artificial life},
  volume    = {15},
  number    = {2},
  pages     = {185--212},
  year      = {2009},
  publisher = {MIT Press},
  url       = {http://eplex.cs.ucf.edu/hyperNEATpage/}
}
@inproceedings{schmidhuber1993self,
  author       = {Schmidhuber, Juergen},
  title        = {A ‘self-referential’ weight matrix},
  booktitle    = {International Conference on Artificial Neural Networks},
  pages        = {446--450},
  year         = {1993},
  organization = {Springer},
  url          = {https://mediatum.ub.tum.de/doc/814784/file.pdf}
}
@inproceedings{clune2009evolving,
  author       = {Clune, Jeff and Beckmann, Benjamin E and Ofria, Charles and Pennock, Robert T},
  title        = {Evolving coordinated quadruped gaits with the HyperNEAT generative encoding},
  booktitle    = {2009 IEEE Congress on Evolutionary Computation},
  pages        = {2764--2771},
  year         = {2009},
  organization = {IEEE},
  url          = {https://bit.ly/2SqUrNJ}
}
@inproceedings{risi2013confronting,
  author    = {Risi, Sebastian and Stanley, Kenneth O},
  title     = {Confronting the challenge of learning a flexible neural controller for a diversity of morphologies},
  booktitle = {Proceedings of the 15th annual conference on Genetic and evolutionary computation},
  pages     = {255--262},
  year      = {2013},
  url       = {https://eplex.cs.ucf.edu/papers/risi_gecco13b.pdf}
}
@article{stanley2007cppn,
  author    = {Stanley, Kenneth O},
  title     = {Compositional pattern producing networks: A novel abstraction of development},
  journal   = {Genetic programming and evolvable machines},
  volume    = {8},
  number    = {2},
  pages     = {131--162},
  year      = {2007},
  publisher = {Springer},
  url       = {https://eplex.cs.ucf.edu/papers/stanley_gpem07.pdf}
}
@article{otorogallery,
  author  = {David Ha},
  title   = {CPPN-NEAT produced artworks},
  journal = {blog.otoro.net},
  year    = {2015},
  url     = {http://otoro.net/gallery}
}
@inproceedings{opennmt,
  author    = {Guillaume Klein and Yoon Kim and Yuntian Deng and Jean Senellart and Alexander M. Rush},
  title     = {OpenNMT: Open-Source Toolkit for Neural Machine Translation},
  booktitle = {Proc. ACL},
  year      = {2017},
  doi       = {10.18653/v1/P17-4012},
  url       = {https://doi.org/10.18653/v1/P17-4012}
}
@article{dai2019transformer,
  author  = {Dai, Zihang and Yang, Zhilin and Yang, Yiming and Carbonell, Jaime and Le, Quoc V and Salakhutdinov, Ruslan},
  title   = {Transformer-XL: Attentive language models beyond a fixed-length context},
  journal = {arXiv preprint arXiv:1901.02860},
  year    = {2019},
  url     = {https://arxiv.org/abs/1901.02860}
}
@article{risi2012enhanced,
  author  = {Risi, Sebastian and Stanley, Kenneth O},
  title   = {An enhanced hypercube-based encoding for evolving the placement, density, and connectivity of neurons},
  journal = {Artificial Life},
  volume  = {18},
  number  = {4},
  pages   = {331--363},
  year    = {2012},
  url     = {https://eplex.cs.ucf.edu/papers/risi_alife12.pdf}
}
@incollection{NIPS2017_7181,
  author    = {Vaswani, Ashish and Shazeer, Noam and Parmar, Niki and Uszkoreit, Jakob and Jones, Llion and Gomez, Aidan N and Kaiser, Lukasz and Polosukhin, Illia},
  title     = {Attention is All you Need},
  booktitle = {Advances in Neural Information Processing Systems 30},
  editor    = {I. Guyon and U. V. Luxburg and S. Bengio and H. Wallach and R. Fergus and S. Vishwanathan and R. Garnett},
  pages     = {5998--6008},
  year      = {2017},
  publisher = {Curran Associates, Inc.},
  url       = {http://papers.nips.cc/paper/7181-attention-is-all-you-need.pdf}
}
@inproceedings{devlin-etal-2019-bert,
  author    = {Devlin, Jacob and Chang, Ming-Wei and Lee, Kenton and Toutanova, Kristina},
  title     = {BERT: Pre-training of Deep Bidirectional Transformers for Language Understanding},
  booktitle = {Proceedings of the 2019 Conference of the North {A}merican Chapter of the Association for Computational Linguistics: Human Language Technologies, Volume 1 (Long and Short Papers)},
  pages     = {4171--4186},
  month     = jun,
  year      = {2019},
  address   = {Minneapolis, Minnesota},
  publisher = {Association for Computational Linguistics},
  doi       = {10.18653/v1/N19-1423},
  url       = {https://www.aclweb.org/anthology/N19-1423}
}
@article{radford2019language,
  author  = {Radford, Alec and Wu, Jeff and Child, Rewon and Luan, David and Amodei, Dario and Sutskever, Ilya},
  title   = {Language Models are Unsupervised Multitask Learners},
  journal = {OpenAI Blog},
  year    = {2019},
  url     = {https://bit.ly/31PMViq}
}
@inproceedings{DBLP:journals/corr/abs-1911-03584,
  author    = {Jean-Baptiste Cordonnier and Andreas Loukas and Martin Jaggi},
  title     = {On the Relationship between Self-Attention and Convolutional Layers},
  booktitle = {International Conference on Learning Representations},
  year      = {2020},
  url       = {https://openreview.net/forum?id=HJlnC1rKPB}
}
@inproceedings{DBLP:conf/nips/ParmarRVBLS19,
  author    = {Niki Parmar and Prajit Ramachandran and Ashish Vaswani and Irwan Bello and Anselm Levskaya and Jon Shlens},
  title     = {Stand-Alone Self-Attention in Vision Models},
  booktitle = {Advances in Neural Information Processing Systems 32: Annual Conference on Neural Information Processing Systems 2019, NeurIPS 2019, 8-14 December 2019, Vancouver, BC, Canada},
  pages     = {68--80},
  year      = {2019},
  url       = {http://papers.nips.cc/paper/8302-stand-alone-self-attention-in-vision-models},
  timestamp = {Mon, 13 Jan 2020 09:28:31 +0100},
  biburl    = {https://dblp.org/rec/bib/conf/nips/ParmarRVBLS19},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{hu2019local,
  author    = {Hu, Han and Zhang, Zheng and Xie, Zhenda and Lin, Stephen},
  title     = {Local relation networks for image recognition},
  booktitle = {Proceedings of the IEEE International Conference on Computer Vision},
  pages     = {3464--3473},
  year      = {2019},
  url       = {https://arxiv.org/abs/1904.11491}
}
@inproceedings{bello2019attention,
  author    = {Bello, Irwan and Zoph, Barret and Vaswani, Ashish and Shlens, Jonathon and Le, Quoc V},
  title     = {Attention augmented convolutional networks},
  booktitle = {Proceedings of the IEEE International Conference on Computer Vision},
  pages     = {3286--3295},
  year      = {2019},
  url       = {https://arxiv.org/abs/1904.09925}
}
@article{DBLP:journals/tciaig/WydmuchKJ19,
  author    = {Marek Wydmuch and Michal Kempka and Wojciech Jaskowski},
  title     = {ViZDoom Competitions: Playing Doom From Pixels},
  journal   = {{IEEE} Trans. Games},
  volume    = {11},
  number    = {3},
  pages     = {248--259},
  year      = {2019},
  doi       = {10.1109/TG.2018.2877047},
  url       = {https://arxiv.org/abs/1809.03470},
  timestamp = {Sat, 12 Oct 2019 12:50:29 +0200},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@book{dehaene2014consciousness,
  author    = {Dehaene, Stanislas},
  title     = {Consciousness and the brain: Deciphering how the brain codes our thoughts},
  publisher = {Penguin},
  year      = {2014},
  url       = {https://en.wikipedia.org/wiki/Consciousness_and_the_Brain}
}
@article{mnih2013playing,
  author  = {Mnih, Volodymyr and Kavukcuoglu, Koray and Silver, David and Graves, Alex and Antonoglou, Ioannis and Wierstra, Daan and Riedmiller, Martin},
  title   = {Playing Atari with deep reinforcement learning},
  journal = {arXiv preprint arXiv:1312.5602},
  year    = {2013},
  url     = {https://arxiv.org/abs/1312.5602}
}
@article{mnih2015humanlevel,
  author    = {Mnih, Volodymyr and Kavukcuoglu, Koray and Silver, David and Rusu, Andrei A and Veness, Joel and Bellemare, Marc G and Graves, Alex and Riedmiller, Martin and Fidjeland, Andreas K and Ostrovski, Georg and others},
  title     = {Human-level control through deep reinforcement learning},
  journal   = {Nature},
  volume    = {518},
  number    = {7540},
  pages     = {529--533},
  year      = {2015},
  publisher = {Nature Publishing Group},
  url       = {https://daiwk.github.io/assets/dqn.pdf}
}
@article{vul2009attention,
  author    = {Vul, Edward and Hanus, Deborah and Kanwisher, Nancy},
  title     = {Attention as inference: selection is probabilistic; responses are all-or-none samples},
  journal   = {Journal of Experimental Psychology: General},
  volume    = {138},
  number    = {4},
  pages     = {546--560},
  year      = {2009},
  publisher = {American Psychological Association},
  url       = {https://www.ncbi.nlm.nih.gov/pmc/articles/PMC2822457/}
}
@article{salimans2017evolution,
  author  = {Salimans, T. and Ho, J. and Chen, X. and Sidor, S. and Sutskever, I.},
  title   = {Evolution Strategies as a Scalable Alternative to Reinforcement Learning},
  journal = {Preprint arXiv:1703.03864},
  year    = {2017},
  url     = {https://arxiv.org/abs/1703.03864}
}
@article{ha2017evolving,
  author  = {Ha, D.},
  title   = {Evolving Stable Strategies},
  journal = {http://blog.otoro.net/},
  year    = {2017},
  url     = {http://blog.otoro.net/2017/11/12/evolving-stable-strategies/}
}
@article{such2017deep,
  author  = {Such, Felipe Petroski and Madhavan, Vashisht and Conti, Edoardo and Lehman, Joel and Stanley, Kenneth O and Clune, Jeff},
  title   = {Deep neuroevolution: Genetic algorithms are a competitive alternative for training deep neural networks for reinforcement learning},
  journal = {arXiv preprint arXiv:1712.06567},
  year    = {2017},
  url     = {https://arxiv.org/abs/1712.06567}
}
@article{ha2018designrl,
  title={Reinforcement Learning for Improving Agent Design},
  author={David Ha},
  journal={arXiv:1810.03779},
  year={2018},
  url={https://designrl.github.io}
}
@inproceedings{mania2018simple,
  author    = {Mania, Horia and Guy, Aurelia and Recht, Benjamin},
  title     = {Simple random search of static linear policies is competitive for reinforcement learning},
  booktitle = {Advances in Neural Information Processing Systems},
  pages     = {1800--1809},
  year      = {2018},
  url       = {https://papers.nips.cc/paper/7451-simple-random-search-of-static-linear-policies-is-competitive-for-reinforcement-learning.pdf}
}
@inproceedings{ha2017hypernetworks,
  author    = {Ha, David and Dai, Andrew and Le, Quoc V},
  title     = {Hypernetworks},
  booktitle = {Fifth International Conference on Learning Representations (ICLR 2017)},
  year      = {2017},
  url       = {https://openreview.net/forum?id=rkpACe1lx}
}
@article{schmidhuber1991learning,
  author    = {Schmidhuber, Juergen and Huber, Rudolf},
  title     = {Learning to generate artificial fovea trajectories for target detection},
  journal   = {International Journal of Neural Systems},
  volume    = {2},
  number    = {01n02},
  pages     = {125--134},
  year      = {1991},
  publisher = {World Scientific},
  url       = {http://people.idsia.ch/~juergen/attentive.html}
}
@inproceedings{stollenga2014deep,
  author    = {Stollenga, Marijn F and Masci, Jonathan and Gomez, Faustino and Schmidhuber, Juergen},
  title     = {Deep networks with internal selective attention through feedback connections},
  booktitle = {Advances in neural information processing systems},
  pages     = {3545--3553},
  year      = {2014},
  url       = {https://arxiv.org/abs/1407.3068}
}
@inproceedings{zambaldi2018deep,
  author    = {Vinicius Zambaldi and David Raposo and Adam Santoro and Victor Bapst and Yujia Li and Igor Babuschkin and Karl Tuyls and David Reichert and Timothy Lillicrap and Edward Lockhart and Murray Shanahan and Victoria Langston and Razvan Pascanu and Matthew Botvinick and Oriol Vinyals and Peter Battaglia},
  title     = {Deep reinforcement learning with relational inductive biases},
  booktitle = {International Conference on Learning Representations},
  year      = {2019},
  url       = {https://openreview.net/forum?id=HkxaFoC9KQ}
}
Duplicate record for citation key Sorokin2015DeepAR removed here; the identical entry defined earlier in this bibliography is the one kept.
@inproceedings{DBLP:conf/aaai/ChoiLZ17,
  author    = {Jinyoung Choi and Beom{-}Jin Lee and Byoung{-}Tak Zhang},
  title     = {Multi-Focus Attention Network for Efficient Deep Reinforcement Learning},
  booktitle = {The Workshops of the Thirty-First {AAAI} Conference on Artificial Intelligence, Saturday, February 4-9, 2017, San Francisco, California, {USA}},
  year      = {2017},
  url       = {http://aaai.org/ocs/index.php/WS/AAAIW17/paper/view/15100},
  timestamp = {Wed, 24 Apr 2019 10:44:20 +0200},
  biburl    = {https://dblp.org/rec/bib/conf/aaai/ChoiLZ17},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{bloem2018,
  author  = {Peter Bloem},
  title   = {Transformers from Scratch},
  journal = {http://www.peterbloem.nl/},
  year    = {2019},
  url     = {http://www.peterbloem.nl/blog/transformers}
}
@inproceedings{munkhdalai2017meta,
  author       = {Munkhdalai, Tsendsuren and Yu, Hong},
  title        = {Meta networks},
  booktitle    = {Proceedings of the 34th International Conference on Machine Learning},
  volume       = {70},
  pages        = {2554--2563},
  year         = {2017},
  organization = {JMLR.org},
  url          = {https://arxiv.org/abs/1703.00837}
}
@inproceedings{chen2018neural,
  author    = {Chen, Tian Qi and Rubanova, Yulia and Bettencourt, Jesse and Duvenaud, David K},
  title     = {Neural ordinary differential equations},
  booktitle = {Advances in neural information processing systems},
  pages     = {6571--6583},
  year      = {2018},
  url       = {https://arxiv.org/abs/1806.07366}
}
@article{dumoulin2018featurewise,
  author  = {Dumoulin, Vincent and Perez, Ethan and Schucher, Nathan and Strub, Florian and de Vries, Harm and Courville, Aaron and Bengio, Yoshua},
  title   = {Feature-wise transformations},
  journal = {Distill},
  year    = {2018},
  doi     = {10.23915/distill.00011},
  url     = {https://distill.pub/2018/feature-wise-transformations}
}
@inproceedings{Oswald2020Continual,
  author    = {Johannes von Oswald and Christian Henning and João Sacramento and Benjamin F. Grewe},
  title     = {Continual learning with hypernetworks},
  booktitle = {International Conference on Learning Representations},
  year      = {2020},
  url       = {https://openreview.net/forum?id=SJgwNerKvB}
}
@inproceedings{ba2016using,
  author    = {Ba, Jimmy and Hinton, Geoffrey E and Mnih, Volodymyr and Leibo, Joel Z and Ionescu, Catalin},
  title     = {Using fast weights to attend to the recent past},
  booktitle = {Advances in Neural Information Processing Systems},
  pages     = {4331--4339},
  year      = {2016},
  url       = {https://arxiv.org/abs/1610.06258}
}
@article{miconi2018differentiable,
  author  = {Miconi, Thomas and Clune, Jeff and Stanley, Kenneth O},
  title   = {Differentiable plasticity: training plastic neural networks with backpropagation},
  journal = {arXiv preprint arXiv:1804.02464},
  year    = {2018},
  url     = {https://arxiv.org/abs/1804.02464}
}
@book{hebb1949organization,
  author    = {Hebb, Donald O},
  title     = {The organization of behavior},
  publisher = {Wiley},
  year      = {1949},
  url       = {https://en.wikipedia.org/wiki/Hebbian_theory}
}
@article{koren2009matrix,
  author    = {Koren, Yehuda and Bell, Robert and Volinsky, Chris},
  title     = {Matrix factorization techniques for recommender systems},
  journal   = {Computer},
  volume    = {42},
  number    = {8},
  pages     = {30--37},
  year      = {2009},
  publisher = {IEEE},
  url       = {https://datajobs.com/data-science-repo/Recommender-Systems-[Netflix].pdf}
}
@online{pineau2018,
  author  = {Joelle Pineau},
  title   = {Reproducible, Reusable, and Robust Reinforcement Learning - NeurIPS 2018},
  year    = {2018},
  url     = {https://youtu.be/Kee4ch3miVA?t=2077},
  urldate = {2020-02-01}
}
@online{catvideo2015,
  author    = {Extraordinary Epic},
  title     = {Fat Cat Fail Vines Compilation},
  publisher = {Video from YouTube (Creative Commons license, reuse allowed)},
  year      = {2015},
  url       = {https://youtu.be/zeeH-Z_Y4as},
  urldate   = {2020-03-01}
}
@online{kof2019,
  author    = {Satsui Hado},
  title     = {The King of Fighters '98 Arcade Playthrough},
  publisher = {The King of Fighters is a registered trademark of SNK Playmore Corporation.<br/>Video from YouTube (Creative Commons license, reuse allowed)},
  year      = {2019},
  url       = {https://youtu.be/Q3fpMQ3uqBQ},
  urldate   = {2020-03-01}
}
@article{zhang2018natural,
  author  = {Zhang, Amy and Wu, Yuxin and Pineau, Joelle},
  title   = {Natural environment benchmarks for reinforcement learning},
  journal = {arXiv preprint arXiv:1811.06032},
  year    = {2018},
  url     = {https://arxiv.org/abs/1811.06032}
}
@book{mack1998inattentional,
  author    = {Mack, Arien and Rock, Irvin},
  title     = {Inattentional blindness},
  publisher = {MIT Press},
  year      = {1998},
  url       = {https://en.wikipedia.org/wiki/Inattentional_blindness}
}
@book{kahneman2011thinking,
  title={Thinking, Fast and Slow},
  author={Kahneman, Daniel},
  publisher={Farrar, Straus and Giroux},
  year={2011},
  url={https://en.wikipedia.org/wiki/Thinking,_Fast_and_Slow}
}
@inproceedings{cuccu2019playing,
  author       = {Cuccu, Giuseppe and Togelius, Julian and Cudre-Mauroux, Philippe},
  title        = {Playing Atari with six neurons},
  booktitle    = {Proceedings of the 18th international conference on autonomous agents and multiagent systems},
  pages        = {998--1006},
  year         = {2019},
  organization = {International Foundation for Autonomous Agents and Multiagent Systems},
  url          = {https://arxiv.org/abs/1806.01363}
}
@article{hochreiter1997long,
  title={Long short-term memory},
  author={Hochreiter, Sepp and Schmidhuber, Juergen},
  journal={Neural computation},
  volume={9},
  number={8},
  pages={1735--1780},
  year={1997},
  publisher={MIT Press},
  keywords={lstm rnn},
  url={http://people.idsia.ch/~juergen/rnn.html}
}
@incollection{Hansen2006,
  author    = {Hansen, Nikolaus},
  title     = {The CMA evolution strategy: a comparing review},
  booktitle = {Towards a new evolutionary computation},
  pages     = {75--102},
  year      = {2006},
  publisher = {Springer},
  url       = {https://bit.ly/39TxcBR}
}
@article{es_on_gke,
  author  = {Yujin Tang and David Ha},
  title   = {How to run evolution strategies on Google Kubernetes Engine},
  journal = {https://cloud.google.com/blog},
  year    = {2019},
  url     = {https://cloud.google.com/blog/products/ai-machine-learning/how-to-run-evolution-strategies-on-google-kubernetes-engine}
}
@article{otoro_blog,
  author  = {David Ha},
  title   = {A Visual Guide to Evolution Strategies},
  journal = {http://blog.otoro.net},
  year    = {2017},
  url     = {http://blog.otoro.net/2017/10/29/visual-evolution-strategies/}
}
@inproceedings{10.1007/978-3-319-99259-4_33,
  author       = {Muller, Nils and Glasmachers, Tobias},
  title        = {Challenges in high-dimensional reinforcement learning with evolution strategies},
  booktitle    = {International Conference on Parallel Problem Solving from Nature},
  pages        = {411--423},
  year         = {2018},
  organization = {Springer},
  url          = {https://arxiv.org/abs/1806.01224}
}
@misc{hansen2019pycma,
  title={CMA-ES/pycma on Github},
  author={Nikolaus Hansen and Youhei Akimoto and Petr Baudis},
  howpublished={Zenodo, DOI:10.5281/zenodo.2559634},
  year={2019},
  month=feb,
  doi={10.5281/zenodo.2559634},
  url={https://doi.org/10.5281/zenodo.2559634}
}
@ARTICLE{brockman2016openai,
  author  = {Brockman, G. and Cheung, V. and Pettersson, L. and Schneider, J. and Schulman, J. and Tang, J. and Zaremba, W.},
  title   = {OpenAI Gym},
  journal = {Preprint arXiv:1606.01540},
  month   = jun,
  year    = {2016},
  url     = {https://arxiv.org/abs/1606.01540}
}
@online{CarRacing-v0,
  author       = {Oleg Klimov},
  title        = {CarRacing-v0},
  year         = {2016},
  url          = {https://gym.openai.com/envs/CarRacing-v0/},
  lastaccessed = {January 17, 2020}
}
@online{DoomTakeCover-v0,
  author       = {Philip Paquette},
  title        = {DoomTakeCover-v0},
  year         = {2017},
  url          = {https://gym.openai.com/envs/DoomTakeCover-v0/},
  lastaccessed = {January 17, 2020}
}
@inproceedings{DBLP:conf/cig/KempkaWRTJ16,
  author    = {Michal Kempka and Marek Wydmuch and Grzegorz Runc and Jakub Toczek and Wojciech Jaskowski},
  title     = {ViZDoom: A Doom-based AI research platform for visual reinforcement learning},
  booktitle = {IEEE Conference on Computational Intelligence and Games, CIG 2016, Santorini, Greece, September 20-23, 2016},
  pages     = {1--8},
  year      = {2016},
  doi       = {10.1109/CIG.2016.7860433},
  url       = {https://doi.org/10.1109/CIG.2016.7860433},
  timestamp = {Wed, 16 Oct 2019 14:14:56 +0200},
  biburl    = {https://dblp.org/rec/bib/conf/cig/KempkaWRTJ16},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@incollection{ha2018worldmodels,
  author={Ha, David and Schmidhuber, Juergen},
  title={Recurrent World Models Facilitate Policy Evolution},
  booktitle={Advances in Neural Information Processing Systems 31},
  pages={2451--2463},
  publisher={Curran Associates, Inc.},
  year={2018},
  url={https://worldmodels.github.io}
}
@article{hafner2018learning,
  author  = {Hafner, Danijar and Lillicrap, Timothy and Fischer, Ian and Villegas, Ruben and Ha, David and Lee, Honglak and Davidson, James},
  title   = {Learning latent dynamics for planning from pixels},
  journal = {arXiv preprint arXiv:1811.04551},
  year    = {2018},
  url     = {https://planetrl.github.io/}
}
@article{kaiser2019model,
  author  = {Kaiser, Lukasz and Babaeizadeh, Mohammad and Milos, Piotr and Osinski, Blazej and Campbell, Roy H and Czechowski, Konrad and Erhan, Dumitru and Finn, Chelsea and Kozakowski, Piotr and Levine, Sergey and others},
  title   = {Model-based reinforcement learning for Atari},
  journal = {arXiv preprint arXiv:1903.00374},
  year    = {2019},
  url     = {https://arxiv.org/abs/1903.00374}
}
@inproceedings{freeman2019learning,
  author    = {Freeman, Daniel and Ha, David and Metz, Luke},
  title     = {Learning to Predict Without Looking Ahead: World Models Without Forward Prediction},
  booktitle = {Advances in Neural Information Processing Systems},
  pages     = {5380--5391},
  year      = {2019},
  url       = {https://learningtopredict.github.io/}
}
@article{DBLP:journals/corr/abs-1911-08265,
  author        = {Julian Schrittwieser and Ioannis Antonoglou and Thomas Hubert and Karen Simonyan and Laurent Sifre and Simon Schmitt and Arthur Guez and Edward Lockhart and Demis Hassabis and Thore Graepel and Timothy P. Lillicrap and David Silver},
  title         = {Mastering Atari, Go, Chess and Shogi by Planning with a Learned Model},
  journal       = {CoRR},
  volume        = {abs/1911.08265},
  year          = {2019},
  url           = {http://arxiv.org/abs/1911.08265},
  archivePrefix = {arXiv},
  eprint        = {1911.08265},
  timestamp     = {Mon, 02 Dec 2019 17:48:37 +0100},
  bibsource     = {dblp computer science bibliography, https://dblp.org}
}
@article{gelada2019deepmdp,
  author  = {Gelada, Carles and Kumar, Saurabh and Buckman, Jacob and Nachum, Ofir and Bellemare, Marc G},
  title   = {DeepMDP: Learning continuous latent space models for representation learning},
  journal = {arXiv preprint arXiv:1906.02736},
  year    = {2019},
  url     = {https://arxiv.org/abs/1906.02736}
}
@inproceedings{DBLP:conf/gecco/RisiS19,
  author    = {Sebastian Risi and Kenneth O. Stanley},
  title     = {Deep neuroevolution of recurrent and discrete world models},
  booktitle = {Proceedings of the Genetic and Evolutionary Computation Conference, GECCO 2019, Prague, Czech Republic, July 13-17, 2019},
  pages     = {456--462},
  year      = {2019},
  doi       = {10.1145/3321707.3321817},
  url       = {https://arxiv.org/abs/1906.08857},
  timestamp = {Thu, 04 Jul 2019 12:06:53 +0200},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2001-01683,
  author        = {Sebastian Risi and Kenneth O. Stanley},
  title         = {Improving Deep Neuroevolution via Deep Innovation Protection},
  journal       = {CoRR},
  volume        = {abs/2001.01683},
  year          = {2020},
  url           = {http://arxiv.org/abs/2001.01683},
  archivePrefix = {arXiv},
  eprint        = {2001.01683},
  timestamp     = {Fri, 10 Jan 2020 13:10:19 +0100},
  bibsource     = {dblp computer science bibliography, https://dblp.org}
}
Duplicate record for citation key such2017deep removed here; the entry with the same key defined earlier in this bibliography is the one kept.
@inproceedings{mnih2014recurrent,
  author    = {Mnih, Volodymyr and Heess, Nicolas and Graves, Alex and Kavukcuoglu, Koray},
  title     = {Recurrent models of visual attention},
  booktitle = {Advances in neural information processing systems},
  pages     = {2204--2212},
  year      = {2014},
  url       = {https://arxiv.org/abs/1406.6247}
}
@article{ye2020rotation,
  author  = {Ye, Chang and Khalifa, Ahmed and Bontrager, Philip and Togelius, Julian},
  title   = {Rotation, Translation, and Cropping for Zero-Shot Generalization},
  journal = {arXiv preprint arXiv:2001.09908},
  year    = {2020},
  url     = {https://arxiv.org/abs/2001.09908}
}
@article{zhao2019investigating,
  author  = {Zhao, Chenyang and Sigaud, Olivier and Stulp, Freek and Hospedales, Timothy M},
  title   = {Investigating generalisation in continuous deep reinforcement learning},
  journal = {arXiv preprint arXiv:1902.07015},
  year    = {2019},
  url     = {https://arxiv.org/abs/1902.07015}
}
@article{packer2018assessing,
  author  = {Packer, Charles and Gao, Katelyn and Kos, Jernej and Kr{\"a}henb{\"u}hl, Philipp and Koltun, Vladlen and Song, Dawn},
  title   = {Assessing generalization in deep reinforcement learning},
  journal = {arXiv preprint arXiv:1810.12282},
  year    = {2018},
  url     = {https://arxiv.org/abs/1810.12282}
}
@article{agarwal2019learning,
  author  = {Agarwal, Rishabh and Liang, Chen and Schuurmans, Dale and Norouzi, Mohammad},
  title   = {Learning to generalize from sparse and underspecified rewards},
  journal = {arXiv preprint arXiv:1902.07198},
  year    = {2019},
  url     = {https://arxiv.org/abs/1902.07198}
}
@article{hill2019emergent,
  author  = {Hill, Felix and Lampinen, Andrew and Schneider, Rosalia and Clark, Stephen and Botvinick, Matthew and McClelland, James L and Santoro, Adam},
  title   = {Emergent systematic generalization in a situated agent},
  journal = {arXiv preprint arXiv:1910.00571},
  year    = {2019},
  url     = {https://arxiv.org/abs/1910.00571}
}
@article{cobbe2018quantifying,
  author  = {Cobbe, Karl and Klimov, Oleg and Hesse, Chris and Kim, Taehoon and Schulman, John},
  title   = {Quantifying generalization in reinforcement learning},
  journal = {arXiv preprint arXiv:1812.02341},
  year    = {2018},
  url     = {https://arxiv.org/abs/1812.02341}
}
@article{juliani2019obstacle,
  author  = {Juliani, Arthur and Khalifa, Ahmed and Berges, Vincent-Pierre and Harper, Jonathan and Teng, Ervin and Henry, Hunter and Crespi, Adam and Togelius, Julian and Lange, Danny},
  title   = {Obstacle tower: A generalization challenge in vision, control, and planning},
  journal = {arXiv preprint arXiv:1902.01378},
  year    = {2019},
  url     = {https://arxiv.org/abs/1902.01378}
}
@inproceedings{adebayo2018sanity,
  author    = {Adebayo, Julius and Gilmer, Justin and Muelly, Michael and Goodfellow, Ian and Hardt, Moritz and Kim, Been},
  title     = {Sanity checks for saliency maps},
  booktitle = {Advances in Neural Information Processing Systems},
  pages     = {9505--9515},
  year      = {2018},
  url       = {https://arxiv.org/abs/1810.03292}
}
@article{Ding2019ImprovingSS,
  author  = {Lei Ding and Hao Tang and Lorenzo Bruzzone},
  title   = {Improving Semantic Segmentation of Aerial Images Using Patch-based Attention},
  journal = {arXiv preprint arXiv:1911.08877},
  year    = {2019},
  url     = {https://arxiv.org/abs/1911.08877}
}
@article{DBLP:journals/corr/abs-1904-01784,
  author        = {Yuning Chai},
  title         = {Patchwork: A Patch-wise Attention Network for Efficient Object Detection and Segmentation in Video Streams},
  journal       = {CoRR},
  volume        = {abs/1904.01784},
  year          = {2019},
  url           = {https://arxiv.org/abs/1904.01784},
  archivePrefix = {arXiv},
  eprint        = {1904.01784},
  timestamp     = {Wed, 24 Apr 2019 12:21:25 +0200},
  biburl        = {https://dblp.org/rec/journals/corr/abs-1904-01784.bib},
  bibsource     = {dblp computer science bibliography, https://dblp.org}
}
@article{sumbul2019cnn,
  author  = {Sumbul, Gencer and Demir, Begum},
  title   = {A CNN-RNN Framework with a Novel Patch-Based Multi-Attention Mechanism for Multi-Label Image Classification in Remote Sensing},
  journal = {arXiv preprint arXiv:1902.11274},
  year    = {2019},
  url     = {https://arxiv.org/abs/1902.11274}
}
@article{DBLP:journals/corr/abs-1905-02793,
  author    = {Gessert, Nils and Sentker, Thilo and Madesta, Frederic and Schmitz, Rudiger and Kniep, Helge and Baltruschat, Ivo and Werner, Rene and Schlaefer, Alexander},
  title     = {Skin Lesion Classification Using CNNs with Patch-Based Attention and Diagnosis-Guided Loss Weighting},
  journal   = {IEEE Transactions on Biomedical Engineering},
  year      = {2019},
  publisher = {IEEE},
  url       = {https://arxiv.org/abs/1905.02793}
}
@inproceedings{NIPS2019_8359,
  author    = {Elsayed, Gamaleldin and Kornblith, Simon and Le, Quoc V},
  title     = {Saccader: Improving Accuracy of Hard Attention Models for Vision},
  booktitle = {Advances in Neural Information Processing Systems},
  pages     = {700--712},
  year      = {2019},
  url       = {https://arxiv.org/abs/1908.07644}
}
@article{stanley2003taxonomy,
  author    = {Stanley, Kenneth O and Miikkulainen, Risto},
  title     = {A taxonomy for artificial embryogeny},
  journal   = {Artificial Life},
  volume    = {9},
  number    = {2},
  pages     = {93--130},
  year      = {2003},
  publisher = {MIT Press},
  url       = {http://nn.cs.utexas.edu/?stanley:alife03}
}
@article{clune2011performance,
  author    = {Clune, Jeff and Stanley, Kenneth O and Pennock, Robert T and Ofria, Charles},
  title     = {On the performance of indirect encoding across the continuum of regularity},
  journal   = {IEEE Transactions on Evolutionary Computation},
  volume    = {15},
  number    = {3},
  pages     = {346--367},
  year      = {2011},
  publisher = {IEEE},
  url       = {https://bit.ly/2V8g3QG}
}
@article{schmidhuber1997discovering,
  author    = {Schmidhuber, Juergen},
  title     = {Discovering neural nets with low Kolmogorov complexity and high generalization capability},
  journal   = {Neural Networks},
  volume    = {10},
  number    = {5},
  pages     = {857--873},
  year      = {1997},
  publisher = {Elsevier},
  url       = {ftp://ftp.idsia.ch/pub/juergen/loconet.pdf}
}
@inproceedings{gauci2008case,
  author    = {Gauci, Jason and Stanley, Kenneth O},
  title     = {A Case Study on the Critical Role of Geometric Regularity in Machine Learning},
  booktitle = {AAAI},
  pages     = {628--633},
  year      = {2008},
  url       = {https://www.aaai.org/Papers/AAAI/2008/AAAI08-100.pdf}
}
@inproceedings{gauci2010indirect,
  author       = {Gauci, Jason and Stanley, Kenneth O},
  title        = {Indirect encoding of neural networks for scalable Go},
  booktitle    = {International Conference on Parallel Problem Solving from Nature},
  pages        = {354--363},
  year         = {2010},
  organization = {Springer},
  url          = {http://eplex.cs.ucf.edu/papers/gauci_ppsn10.pdf}
}
@inproceedings{finn2016deep,
  author       = {Finn, Chelsea and Tan, Xin Yu and Duan, Yan and Darrell, Trevor and Levine, Sergey and Abbeel, Pieter},
  title        = {Deep spatial autoencoders for visuomotor learning},
  booktitle    = {2016 IEEE International Conference on Robotics and Automation (ICRA)},
  pages        = {512--519},
  year         = {2016},
  organization = {IEEE},
  url          = {https://arxiv.org/abs/1509.06113}
}
@article{ramanujan2019s,
  author  = {Ramanujan, Vivek and Wortsman, Mitchell and Kembhavi, Aniruddha and Farhadi, Ali and Rastegari, Mohammad},
  title   = {What's Hidden in a Randomly Weighted Neural Network?},
  journal = {arXiv preprint arXiv:1911.13299},
  year    = {2019},
  url     = {https://arxiv.org/abs/1911.13299}
}
@inproceedings{frankle2018the,
  author    = {Jonathan Frankle and Michael Carbin},
  title     = {The Lottery Ticket Hypothesis: Finding Sparse, Trainable Neural Networks},
  booktitle = {International Conference on Learning Representations},
  year      = {2019},
  url       = {https://openreview.net/forum?id=rJl-b3RcF7}
}
@article{zhou2019deconstructing,
  author  = {Zhou, Hattie and Lan, Janice and Liu, Rosanne and Yosinski, Jason},
  title   = {Deconstructing Lottery Tickets: Zeros, Signs, and the Supermask},
  journal = {arXiv preprint arXiv:1905.01067},
  year    = {2019},
  url     = {https://arxiv.org/abs/1905.01067}
}
@article{hasson2020direct,
  author    = {Hasson, Uri and Nastase, Samuel A and Goldstein, Ariel},
  title     = {Direct Fit to Nature: An Evolutionary Perspective on Biological and Artificial Neural Networks},
  journal   = {Neuron},
  volume    = {105},
  number    = {3},
  pages     = {416--434},
  year      = {2020},
  publisher = {Elsevier},
  url       = {https://www.biorxiv.org/content/10.1101/764258v2.full}
}
@inproceedings{krizhevsky2012imagenet,
  author    = {Krizhevsky, Alex and Sutskever, Ilya and Hinton, Geoffrey E},
  title     = {ImageNet classification with deep convolutional neural networks},
  booktitle = {Advances in neural information processing systems},
  pages     = {1097--1105},
  year      = {2012},
  url       = {https://bit.ly/2w3DcZM}
}
@article{cheung2016emergence,
  author  = {Cheung, Brian and Weiss, Eric and Olshausen, Bruno},
  title   = {Emergence of foveal image sampling from learning to attend in visual scenes},
  journal = {arXiv preprint arXiv:1611.09430},
  year    = {2016},
  url     = {https://arxiv.org/abs/1611.09430}
}
@article{ba2014multiple,
  author  = {Ba, Jimmy and Mnih, Volodymyr and Kavukcuoglu, Koray},
  title   = {Multiple object recognition with visual attention},
  journal = {arXiv preprint arXiv:1412.7755},
  year    = {2014},
  url     = {https://arxiv.org/abs/1412.7755}
}
@inproceedings{kansky2017schema,
  author       = {Kansky, Ken and Silver, Tom and M{\'e}ly, David A and Eldawy, Mohamed and L{\'a}zaro-Gredilla, Miguel and Lou, Xinghua and Dorfman, Nimrod and Sidor, Szymon and Phoenix, Scott and George, Dileep},
  title        = {Schema networks: Zero-shot transfer with a generative causal model of intuitive physics},
  booktitle    = {Proceedings of the 34th International Conference on Machine Learning},
  volume       = {70},
  pages        = {1809--1818},
  year         = {2017},
  organization = {JMLR.org},
  url          = {https://arxiv.org/abs/1706.04317}
}
@article{rosten2008faster,
  author    = {Rosten, Edward and Porter, Reid and Drummond, Tom},
  title     = {Faster and better: A machine learning approach to corner detection},
  journal   = {IEEE transactions on pattern analysis and machine intelligence},
  volume    = {32},
  number    = {1},
  pages     = {105--119},
  year      = {2008},
  publisher = {IEEE},
  url       = {https://arxiv.org/abs/0810.2434}
}
@inproceedings{kulkarni2019unsupervised,
  author    = {Kulkarni, Tejas D and Gupta, Ankush and Ionescu, Catalin and Borgeaud, Sebastian and Reynolds, Malcolm and Zisserman, Andrew and Mnih, Volodymyr},
  title     = {Unsupervised learning of object keypoints for perception and control},
  booktitle = {Advances in Neural Information Processing Systems},
  pages     = {10723--10733},
  year      = {2019},
  url       = {https://bit.ly/2wLiEFZ}
}
@article{leibo2018psychlab,
  author  = {Leibo, Joel Z and de Masson d'Autume, Cyprien and Zoran, Daniel and Amos, David and Beattie, Charles and Anderson, Keith and Garc{\'\i}a Casta{\~n}eda, Antonio and Sanchez, Manuel and Green, Simon and Gruslys, Audrunas and others},
  title   = {Psychlab: a psychology laboratory for deep reinforcement learning agents},
  journal = {arXiv preprint arXiv:1801.08116},
  year    = {2018},
  url     = {https://arxiv.org/abs/1801.08116}
}
@article{beyret2019animal,
  author  = {Beyret, Benjamin and Hern{\'a}ndez-Orallo, Jos{\'e} and Cheke, Lucy and Halina, Marta and Shanahan, Murray and Crosby, Matthew},
  title   = {The Animal-AI Environment: Training and Testing Animal-Like Artificial Cognition},
  journal = {arXiv preprint arXiv:1909.07483},
  year    = {2019},
  url     = {https://arxiv.org/abs/1909.07483}
}
@inproceedings{sainath2013low,
  author       = {Sainath, Tara N and Kingsbury, Brian and Sindhwani, Vikas and Arisoy, Ebru and Ramabhadran, Bhuvana},
  title        = {Low-rank matrix factorization for deep neural network training with high-dimensional output targets},
  booktitle    = {2013 IEEE international conference on acoustics, speech and signal processing},
  pages        = {6655--6659},
  year         = {2013},
  organization = {IEEE},
  url          = {https://bit.ly/39ZEF26}
}
@inproceedings{grosse2016kronecker,
  author    = {Grosse, Roger and Martens, James},
  title     = {A kronecker-factored approximate fisher matrix for convolution layers},
  booktitle = {International Conference on Machine Learning},
  pages     = {573--582},
  year      = {2016},
  url       = {http://www.jmlr.org/proceedings/papers/v48/grosse16.pdf}
}
@inproceedings{suwajanakorn2018discovery,
  author    = {Suwajanakorn, Supasorn and Snavely, Noah and Tompson, Jonathan J and Norouzi, Mohammad},
  title     = {Discovery of latent 3d keypoints via end-to-end geometric reasoning},
  booktitle = {Advances in Neural Information Processing Systems},
  pages     = {2059--2070},
  year      = {2018},
  url       = {https://keypointnet.github.io/}
}
@inproceedings{Lee2020Network,
  author    = {Kimin Lee and Kibok Lee and Jinwoo Shin and Honglak Lee},
  title     = {Network Randomization: A Simple Technique for Generalization in Deep Reinforcement Learning},
  booktitle = {International Conference on Learning Representations},
  year      = {2020},
  url       = {https://openreview.net/forum?id=HJgcvJBFvB}
}
@inproceedings{Song2020Observational,
  author    = {Xingyou Song and Yiding Jiang and Stephen Tu and Yilun Du and Behnam Neyshabur},
  title     = {Observational Overfitting in Reinforcement Learning},
  booktitle = {International Conference on Learning Representations},
  year      = {2020},
  url       = {https://openreview.net/forum?id=HJli2hNKDH}
}