-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathREFERENCES.bib
155 lines (146 loc) · 6.13 KB
/
REFERENCES.bib
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
% TorchRL library paper, arXiv preprint 2306.00577 (cs.LG).
% Names are in "Family, Given" form so the compound family name De Fabritiis
% is not split; the capitalised De would otherwise be read as a given name.
% The braced words in the title keep their capitals under sentence-casing styles.
@misc{bou2023torchrl,
  author        = {Bou, Albert and
                   Bettini, Matteo and
                   Dittert, Sebastian and
                   Kumar, Vikash and
                   Sodhani, Shagun and
                   Yang, Xiaomeng and
                   De Fabritiis, Gianni and
                   Moens, Vincent},
  title         = {{TorchRL}: A data-driven decision-making library for {PyTorch}},
  year          = {2023},
  eprint        = {2306.00577},
  archiveprefix = {arXiv},
  primaryclass  = {cs.LG},
}
% OpenStreetMap data attribution (planet dump, 2017).
% The author keeps its doubled braces so the collective name is treated as a
% single indivisible name. Only the URL inside the title is braced, and no
% padding spaces are left inside the title or the url macro argument.
@misc{OpenStreetMap,
  author       = {{OpenStreetMap contributors}},
  title        = {Planet dump retrieved from {https://planet.osm.org}},
  howpublished = {\url{https://www.openstreetmap.org}},
  year         = {2017},
}
% Proximal Policy Optimization, arXiv 1707.06347.
% Record exported from DBLP (see biburl / bibsource); listed as a CoRR article.
@article{DBLP:journals/corr/SchulmanWDRK17,
  author     = {Schulman, John and
                Wolski, Filip and
                Dhariwal, Prafulla and
                Radford, Alec and
                Klimov, Oleg},
  title      = {Proximal Policy Optimization Algorithms},
  journal    = {CoRR},
  volume     = {abs/1707.06347},
  year       = {2017},
  eprinttype = {arXiv},
  eprint     = {1707.06347},
  url        = {http://arxiv.org/abs/1707.06347},
  timestamp  = {Mon, 13 Aug 2018 16:47:34 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/SchulmanWDRK17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% PettingZoo, arXiv 2009.14471.
% Record exported from DBLP (see biburl / bibsource). The library names in the
% title are braced so sentence-casing styles do not lowercase them.
@article{DBLP:journals/corr/abs-2009-14471,
  author     = {Terry, Justin K. and
                Black, Benjamin and
                Hari, Ananth and
                Santos, Luis S. and
                Dieffendahl, Clemens and
                Williams, Niall L. and
                Lokesh, Yashas and
                Horsch, Caroline and
                Ravi, Praveen},
  title      = {{PettingZoo}: {Gym} for Multi-Agent Reinforcement Learning},
  journal    = {CoRR},
  volume     = {abs/2009.14471},
  year       = {2020},
  eprinttype = {arXiv},
  eprint     = {2009.14471},
  url        = {https://arxiv.org/abs/2009.14471},
  timestamp  = {Wed, 06 Apr 2022 15:36:38 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2009-14471.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Cascetta, transportation systems textbook (2009).
% The generic key is kept so existing citations keep resolving.
% The month uses the predefined jan macro and the ISBN holds digits and
% hyphens only.
% NOTE(review): the publisher and the plural Systems in the title follow the
% publisher's catalogue record for this ISBN; confirm against the copy cited.
@book{book,
  author    = {Cascetta, Ennio},
  title     = {Transportation Systems Analysis: Models and Applications},
  publisher = {Springer},
  year      = {2009},
  month     = jan,
  isbn      = {978-0-387-75857-2},
}
% SUMO reference paper, ITSC 2018.
% The conference name and its ITSC acronym are held in booktitle, the field
% that inproceedings styles print. Acronyms are braced so sentence-casing
% styles keep them upper-case.
@inproceedings{SUMO2018,
  author    = {Lopez, Pablo Alvarez and
               Behrisch, Michael and
               Bieker-Walz, Laura and
               Erdmann, Jakob and
               Fl{\"o}tter{\"o}d, Yun-Pang and
               Hilbrich, Robert and
               L{\"u}cken, Leonhard and
               Rummel, Johannes and
               Wagner, Peter and
               Wie{\ss}ner, Evamarie},
  title     = {Microscopic Traffic Simulation using {SUMO}},
  booktitle = {The 21st {IEEE} International Conference on Intelligent Transportation Systems ({ITSC})},
  publisher = {IEEE},
  year      = {2018},
  keywords  = {traffic simulation, modelling, optimization},
  url       = {https://elib.dlr.de/124092/},
}
% Sutton and Barto, Reinforcement Learning, second edition (2018).
% The key still reads 1998 and is left as is so existing citations keep
% resolving. The trailing fields are BibSonomy export metadata that
% bibliography styles ignore.
@book{Sutton1998,
  author    = {Sutton, Richard S. and Barto, Andrew G.},
  title     = {Reinforcement Learning: An Introduction},
  edition   = {Second},
  publisher = {The MIT Press},
  year      = {2018},
  url       = {http://incompleteideas.net/book/the-book-2nd.html},
  added-at  = {2019-07-13T10:11:53.000+0200},
  timestamp = {2019-07-13T10:11:53.000+0200},
  biburl    = {https://www.bibsonomy.org/bibtex/2f46601cf8b13d39d1378af0d79438b12/lanteunis},
  interhash = {ac6b144aaec1819919a2fba9f705c852},
  intrahash = {f46601cf8b13d39d1378af0d79438b12},
}
% QMIX, arXiv 1803.11485.
% Record exported from DBLP (see biburl / bibsource).
% NOTE(review): the third author is parsed with family name de Witt, exactly as
% in the exported record; the family name may really be Schroeder de Witt, in
% which case it needs to be braced as one unit. Confirm before changing.
@article{DBLP:journals/corr/abs-1803-11485,
  author     = {Rashid, Tabish and
                Samvelyan, Mikayel and
                de Witt, Christian Schr{\"{o}}der and
                Farquhar, Gregory and
                Foerster, Jakob N. and
                Whiteson, Shimon},
  title      = {{QMIX:} Monotonic Value Function Factorisation for Deep Multi-Agent Reinforcement Learning},
  journal    = {CoRR},
  volume     = {abs/1803.11485},
  year       = {2018},
  eprinttype = {arXiv},
  eprint     = {1803.11485},
  url        = {http://arxiv.org/abs/1803.11485},
  timestamp  = {Mon, 13 Aug 2018 16:46:51 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1803-11485.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Independent PPO study on the StarCraft benchmark, arXiv 2011.09533.
% Record exported from DBLP (see biburl / bibsource). The game name in the
% title is braced so sentence-casing styles do not lowercase it.
% NOTE(review): the first author is parsed with family name de Witt, exactly as
% in the exported record; the family name may really be Schroeder de Witt, in
% which case it needs to be braced as one unit. Confirm before changing.
@article{DBLP:journals/corr/abs-2011-09533,
  author     = {de Witt, Christian Schr{\"{o}}der and
                Gupta, Tarun and
                Makoviichuk, Denys and
                Makoviychuk, Viktor and
                Torr, Philip H. S. and
                Sun, Mingfei and
                Whiteson, Shimon},
  title      = {Is Independent Learning All You Need in the {StarCraft} Multi-Agent Challenge?},
  journal    = {CoRR},
  volume     = {abs/2011.09533},
  year       = {2020},
  eprinttype = {arXiv},
  eprint     = {2011.09533},
  url        = {https://arxiv.org/abs/2011.09533},
  timestamp  = {Wed, 25 Nov 2020 16:34:14 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2011-09533.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Value-Decomposition Networks, arXiv 1706.05296.
% Record exported from DBLP (see biburl / bibsource); listed as a CoRR article.
@article{DBLP:journals/corr/SunehagLGCZJLSL17,
  author     = {Sunehag, Peter and
                Lever, Guy and
                Gruslys, Audrunas and
                Czarnecki, Wojciech Marian and
                Zambaldi, Vin{\'{\i}}cius Flores and
                Jaderberg, Max and
                Lanctot, Marc and
                Sonnerat, Nicolas and
                Leibo, Joel Z. and
                Tuyls, Karl and
                Graepel, Thore},
  title      = {Value-Decomposition Networks For Cooperative Multi-Agent Learning},
  journal    = {CoRR},
  volume     = {abs/1706.05296},
  year       = {2017},
  eprinttype = {arXiv},
  eprint     = {1706.05296},
  url        = {http://arxiv.org/abs/1706.05296},
  timestamp  = {Mon, 13 Aug 2018 16:46:26 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/SunehagLGCZJLSL17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}