Skip to content

Commit c903a3b

Browse files
authored
Update report (#453)
* Update report * fix cspell * Make some changes * Update with implementation details * Update bibliography.bib * Fix some mistakes * Fix typo * Make the suggested changes * Update date * Fix code * add installation instructions * Update cspell.json * Update cspell.json * Added the mentioned changes
1 parent 8d6c5ca commit c903a3b

4 files changed

Lines changed: 443 additions & 1 deletion

File tree

.cspell/cspell.json

Lines changed: 3 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -122,6 +122,8 @@
122122
"turbulences",
123123
"Decompressor",
124124
"MADDPG",
125+
"Prasidh",
126+
"Srikumar",
125127
"Caglar",
126128
"Gulcehre",
127129
"Novikov",
@@ -142,6 +144,7 @@
142144
"reparamaterize",
143145
"MADDPG",
144146
"rldatasets",
147+
"Trichy",
145148
"Prasidh",
146149
"Srikumar"
147150
],

docs/homepage/blog/index.md

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -3,7 +3,7 @@
33
@def is_enable_toc = false
44

55
- [An Introduction to ReinforcementLearning.jl: Design, Implementations and Thoughts](/blog/an_introduction_to_reinforcement_learning_jl_design_implementations_thoughts)
6-
6+
- [Establish a General Pipeline for Offline Reinforcement Learning Evaluation (Summer OSPP Project 210370741) Mid-term Report](/blog/ospp_mid-term_report_210370741)
77
- Notebooks for the book: [*Reinforcement Learning: an Introduction 2nd
88
Edition*](https://github.com/JuliaReinforcementLearning/ReinforcementLearningAnIntroduction.jl)
99

Lines changed: 34 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,34 @@
1+
% D4RL datasets paper, cited as an arXiv preprint (eprint 2004.07219, cs.LG).
% The acronym in the title is braced so sentence-casing styles keep "D4RL"
% instead of lowercasing it to "D4rl".
@misc{fu2020d4rl,
  author        = {Justin Fu and Aviral Kumar and Ofir Nachum and George Tucker and Sergey Levine},
  title         = {{D4RL}: Datasets for Deep Data-Driven Reinforcement Learning},
  year          = {2020},
  eprint        = {2004.07219},
  archivePrefix = {arXiv},
  primaryClass  = {cs.LG}
}
9+
% Conference paper. For @inproceedings the venue belongs in `booktitle`;
% a `journal` field is ignored by standard styles for this entry type and
% leaves the required `booktitle` missing.
@inproceedings{agarwal2020optimistic,
  author    = {Agarwal, Rishabh and Schuurmans, Dale and Norouzi, Mohammad},
  title     = {An Optimistic Perspective on Offline Reinforcement Learning},
  booktitle = {International Conference on Machine Learning},
  year      = {2020}
}
15+
% RL Unplugged benchmark paper, cited as an arXiv preprint (eprint 2006.13888, cs.LG).
% "de Freitas" is written with its particle separated so BibTeX parses
% von = "de", Last = "Freitas"; the acronym "RL" in the title is braced so
% sentence-casing styles do not turn it into "Rl".
@misc{gulcehre2020rl,
  author        = {Caglar Gulcehre and Ziyu Wang and Alexander Novikov and Tom Le Paine
                   and Sergio Gómez Colmenarejo and Konrad Zolna and Rishabh Agarwal and
                   Josh Merel and Daniel Mankowitz and Cosmin Paduraru and Gabriel
                   Dulac-Arnold and Jerry Li and Mohammad Norouzi and Matt Hoffman and
                   Ofir Nachum and George Tucker and Nicolas Heess and Nando de Freitas},
  title         = {{RL} Unplugged: Benchmarks for Offline Reinforcement Learning},
  year          = {2020},
  eprint        = {2006.13888},
  archivePrefix = {arXiv},
  primaryClass  = {cs.LG}
}
27+
% Off-policy evaluation benchmark paper, cited as an arXiv preprint
% (eprint 2103.16596, cs.LG).
@misc{fu2021benchmarks,
  author        = {Justin Fu and Mohammad Norouzi and Ofir Nachum and George Tucker and Ziyu Wang and Alexander Novikov and Mengjiao Yang and Michael R. Zhang and Yutian Chen and Aviral Kumar and Cosmin Paduraru and Sergey Levine and Tom Le Paine},
  title         = {Benchmarks for Deep Off-Policy Evaluation},
  year          = 2021,
  eprint        = {2103.16596},
  archivePrefix = {arXiv},
  primaryClass  = {cs.LG}
}

0 commit comments

Comments
 (0)