-
Notifications
You must be signed in to change notification settings - Fork 1
/
draft_bib.html
120 lines (111 loc) · 4.02 KB
/
draft_bib.html
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
</dt-appendix>
</body>
<script type="text/bibliography">
% Graves et al. 2017, arXiv preprint on automated curriculum learning.
% eprint and archivePrefix are taken from the arXiv id in the url so this entry
% carries the same identifier fields as the other arXiv-backed entries.
@article{graves2017automated,
  author        = {Graves, Alex and Bellemare, Marc G and Menick, Jacob and Munos, Remi and Kavukcuoglu, Koray},
  title         = {Automated curriculum learning for neural networks},
  journal       = {arXiv preprint},
  year          = {2017},
  archivePrefix = {arXiv},
  eprint        = {1704.03003},
  url           = {https://arxiv.org/pdf/1704.03003.pdf}
}
% Andreas, Klein and Levine 2016, arXiv preprint (entry exported from NASA ADS).
% A standard url field is added, built from the eprint id, because adsurl is an
% ADS-specific field that bibliography renderers do not use for the link.
% Given names are spelled out; the citation key is unchanged.
@article{2016arXiv161101796A,
  author        = {Andreas, Jacob and Klein, Dan and Levine, Sergey},
  title         = {Modular Multitask Reinforcement Learning with Policy Sketches},
  journal       = {ArXiv e-prints},
  archivePrefix = {arXiv},
  eprint        = {1611.01796},
  primaryClass  = {cs.LG},
  keywords      = {Computer Science - Learning, Computer Science - Neural and Evolutionary Computing},
  year          = 2016,
  month         = nov,
  url           = {https://arxiv.org/abs/1611.01796},
  adsurl        = {http://adsabs.harvard.edu/abs/2016arXiv161101796A},
  adsnote       = {Provided by the SAO/NASA Astrophysics Data System}
}
% IMPALA paper (Espeholt et al., ICML 2018).
% The citation key is the original DBLP CoRR key and is kept unchanged so that
% existing citations keep resolving. The old volume value abs/1802.01561 was the
% CoRR identifier, not a proceedings volume; it is replaced by the PMLR volume
% and page range of the ICML 2018 proceedings. The arXiv id stays in eprint/url.
% Authors are on one line in Last, First form so that splitting on " and "
% does not depend on how a parser treats line breaks.
@article{DBLP:journals/corr/abs-1802-01561,
  author        = {Espeholt, Lasse and Soyer, Hubert and Munos, Remi and Simonyan, Karen and Mnih, Volodymyr and Ward, Tom and Doron, Yotam and Firoiu, Vlad and Harley, Tim and Dunning, Iain and Legg, Shane and Kavukcuoglu, Koray},
  title         = {IMPALA: Scalable Distributed Deep-RL with Importance Weighted Actor-Learner Architectures},
  journal       = {Proceedings of the International Conference on Machine Learning (ICML)},
  volume        = {80},
  pages         = {1407--1416},
  year          = {2018},
  url           = {http://arxiv.org/abs/1802.01561},
  archivePrefix = {arXiv},
  eprint        = {1802.01561},
  timestamp     = {Thu, 01 Mar 2018 15:00:45 +0100},
  biburl        = {https://dblp.org/rec/bib/journals/corr/abs-1802-01561},
  bibsource     = {dblp computer science bibliography, https://dblp.org}
}
% Source-code repository accompanying the IMPALA paper.
% Fixes the misspelled given name (Volodymir) so it matches the spelling
% Volodymyr Mnih used in the IMPALA paper entry of this bibliography.
@online{impala_github,
  author    = {Espeholt, Lasse and Soyer, Hubert and Munos, Remi and Simonyan, Karen and Mnih, Volodymyr and Ward, Tom and Doron, Yotam and Firoiu, Vlad and Harley, Tim and Dunning, Iain},
  title     = {Github: Scalable Distributed Deep-RL with Importance Weighted Actor-Learner Architectures},
  publisher = {Github},
  year      = {2018},
  url       = {https://github.com/deepmind/scalable_agent},
  note      = {[Online; accessed 01-Jul-2018]}
}
% Source-code repository for the Automated Curriculum Learning project.
@online{jeju_project_github,
  title     = {Automated Curriculum Learning},
  author    = {Feryal Behbahani},
  year      = {2018},
  publisher = {Github},
  url       = {https://github.com/Feryal/jeju_project},
  note      = {[Online; accessed 01-Jul-2018]}
}
% Auer, Cesa-Bianchi, Freund and Schapire, nonstochastic multiarmed bandits
% (entry exported from the ACM Digital Library; all field values kept as exported).
@article{Auer:2003:NMB:589343.589365,
  author     = {Auer, Peter and Cesa-Bianchi, Nicolo and Freund, Yoav and Schapire, Robert E.},
  title      = {The Nonstochastic Multiarmed Bandit Problem},
  journal    = {SIAM J. Comput.},
  volume     = {32},
  number     = {1},
  pages      = {48--77},
  numpages   = {30},
  year       = {2003},
  month      = jan,
  issue_date = {2003},
  publisher  = {Society for Industrial and Applied Mathematics},
  address    = {Philadelphia, PA, USA},
  issn       = {0097-5397},
  doi        = {10.1137/S0097539701398375},
  url        = {https://doi.org/10.1137/S0097539701398375},
  acmid      = {589365},
  keywords   = {adversarial bandit problem, unknown matrix games}
}
% Zhou 2015, arXiv survey on contextual multi-armed bandits (entry exported from NASA ADS).
% A standard url field is added, built from the eprint id, because adsurl is an
% ADS-specific field that bibliography renderers do not use for the link.
% The given name is spelled out; the citation key is unchanged.
@article{2015arXiv150803326Z,
  author        = {Zhou, Li},
  title         = {A Survey on Contextual Multi-armed Bandits},
  journal       = {ArXiv e-prints},
  archivePrefix = {arXiv},
  eprint        = {1508.03326},
  primaryClass  = {cs.LG},
  keywords      = {Computer Science - Learning},
  year          = 2015,
  month         = aug,
  url           = {https://arxiv.org/abs/1508.03326},
  adsurl        = {http://adsabs.harvard.edu/abs/2015arXiv150803326Z},
  adsnote       = {Provided by the SAO/NASA Astrophysics Data System}
}
% Schmidhuber 2013, PowerPlay, Frontiers in Psychology.
% The pages field holds the article number used by this journal.
@article{s10_powerplay,
  author  = {Schmidhuber, J.},
  title   = {PowerPlay: Training an Increasingly General Problem Solver by Continually Searching for the Simplest Still Unsolvable Problem},
  journal = {Frontiers in Psychology},
  volume  = {4},
  pages   = {313},
  year    = {2013},
  issn    = {1664-1078},
  doi     = {10.3389/fpsyg.2013.00313},
  url     = {https://www.frontiersin.org/article/10.3389/fpsyg.2013.00313}
}
</script>
<script>
// Select the first barplot from this trailing script, i.e. late in page load.
// NOTE(review): switchBarplot is not defined in this part of the file; it is
// presumably declared earlier in the page, and the argument 1 presumably is
// the index of the first barplot - confirm against its definition.
switchBarplot(1);
</script>