update paper info

hakuhodo-technologies · Dec 1, 2023 · 04d0516 · 04d0516
1 parent 5c5e299
commit 04d0516
Show file tree

Hide file tree

Showing 14 changed files with 28 additions and 35 deletions.
diff --git a/README.md b/README.md
@@ -9,7 +9,8 @@
 [![GitHub last commit](https://img.shields.io/github/last-commit/hakuhodo-technologies/scope-rl)](https://github.com/hakuhodo-technologies/scope-rl/graphs/commit-activity)
 [![Documentation Status](https://readthedocs.org/projects/scope-rl/badge/?version=latest)](https://scope-rl.readthedocs.io/en/latest/)
 [![License](https://img.shields.io/badge/License-Apache%202.0-blue.svg)](https://opensource.org/licenses/Apache-2.0)
-[![arXiv](https://img.shields.io/badge/arXiv-23xx.xxxxx-b31b1b.svg)](https://arxiv.org/abs/23xx.xxxxx)
+[![arXiv](https://img.shields.io/badge/arXiv-2311.18206-b31b1b.svg)](https://arxiv.org/abs/2311.18206)
+[![arXiv](https://img.shields.io/badge/arXiv-2311.18207-b31b1b.svg)](https://arxiv.org/abs/2311.18207)
 
 <details>
 <summary><strong>Table of Contents </strong>(click to expand)</summary>
@@ -442,14 +443,14 @@ If you use our software in your work, please cite our paper:
 
 Haruka Kiyohara, Ren Kishimoto, Kosuke Kawakami, Ken Kobayashi, Kazuhide Nakata, Yuta Saito.<br>
 **SCOPE-RL: A Python Library for Offline Reinforcement Learning and Off-Policy Evaluation**<br>
-[link]() (a preprint coming soon..)
+[[arXiv](https://arxiv.org/abs/2311.18206)] [[slides](https://speakerdeck.com/harukakiyohara_/scope-rl)]
 
 Bibtex:
 ```
 @article{kiyohara2023scope,
   author = {Kiyohara, Haruka and Kishimoto, Ren and Kawakami, Kosuke and Kobayashi, Ken and Nakata, Kazuhide and Saito, Yuta},
   title = {SCOPE-RL: A Python Library for Offline Reinforcement Learning and Off-Policy Evaluation},
-  journal={arXiv preprint arXiv:23xx.xxxxx},
+  journal={arXiv preprint arXiv:2311.18206},
   year={2023},
 }
 ```
@@ -458,14 +459,14 @@ If you use our proposed metric "SharpeRatio@k" in your work, please cite our pap
 
 Haruka Kiyohara, Ren Kishimoto, Kosuke Kawakami, Ken Kobayashi, Kazuhide Nakata, Yuta Saito.<br>
 **Towards Assessing and Benchmarking Risk-Return Tradeoff of Off-Policy Evaluation**<br>
-[link]() (a preprint coming soon..)
+[[arXiv](https://arxiv.org/abs/2311.18207)] [[slides](https://speakerdeck.com/harukakiyohara_/towards-risk-return-assessment-of-ope)]
 
 Bibtex:
 ```
 @article{kiyohara2023towards,
   author = {Kiyohara, Haruka and Kishimoto, Ren and Kawakami, Kosuke and Kobayashi, Ken and Nakata, Kazuhide and Saito, Yuta},
   title = {Towards Assessing and Benchmarking Risk-Return Tradeoff of Off-Policy Evaluation},
-  journal={arXiv preprint arXiv:23xx.xxxxx},
+  journal={arXiv preprint arXiv:2311.18207},
   year={2023},
 }
 ```

diff --git a/README_ja.md b/README_ja.md
@@ -9,7 +9,8 @@
 [![GitHub last commit](https://img.shields.io/github/last-commit/hakuhodo-technologies/scope-rl)](https://github.com/hakuhodo-technologies/scope-rl/graphs/commit-activity)
 [![Documentation Status](https://readthedocs.org/projects/scope-rl/badge/?version=latest)](https://scope-rl.readthedocs.io/en/latest/)
 [![License](https://img.shields.io/badge/License-Apache%202.0-blue.svg)](https://opensource.org/licenses/Apache-2.0)
-[![arXiv](https://img.shields.io/badge/arXiv-23xx.xxxxx-b31b1b.svg)](https://arxiv.org/abs/23xx.xxxxx)
+[![arXiv](https://img.shields.io/badge/arXiv-2311.18206-b31b1b.svg)](https://arxiv.org/abs/2311.18206)
+[![arXiv](https://img.shields.io/badge/arXiv-2311.18207-b31b1b.svg)](https://arxiv.org/abs/2311.18207)
 
 <details>
 <summary><strong>目次</strong>(クリックして展開)</summary>
@@ -450,14 +451,14 @@ ops.visualize_conditional_value_at_risk_for_validation(
 
 Haruka Kiyohara, Ren Kishimoto, Kosuke Kawakami, Ken Kobayashi, Kazuhide Nakata, Yuta Saito.<br>
 **SCOPE-RL: A Python Library for Offline Reinforcement Learning and Off-Policy Evaluation**<br>
-[link]() (a preprint coming soon..)
+[[arXiv](https://arxiv.org/abs/2311.18206)] [[日本語スライド](https://speakerdeck.com/aiueola/scope-rl-ja)]
 
 Bibtex:
 ```
 @article{kiyohara2023scope,
   author = {Kiyohara, Haruka and Kishimoto, Ren and Kawakami, Kosuke and Kobayashi, Ken and Nakata, Kazuhide and Saito, Yuta},
   title = {SCOPE-RL: A Python Library for Offline Reinforcement Learning and Off-Policy Evaluation},
-  journal={arXiv preprint arXiv:23xx.xxxxx},
+  journal={arXiv preprint arXiv:2311.18206},
   year={2023},
 }
 ```
@@ -466,14 +467,14 @@ Bibtex:
 
 Haruka Kiyohara, Ren Kishimoto, Kosuke Kawakami, Ken Kobayashi, Kazuhide Nakata, Yuta Saito.<br>
 **Towards Assessing and Benchmarking Risk-Return Tradeoff of Off-Policy Evaluation**<br>
-[link]() (a preprint coming soon..)
+[[arXiv](https://arxiv.org/abs/2311.18207)] [[日本語スライド](https://speakerdeck.com/aiueola/towards-risk-return-assessment-of-ope-ja)]
 
 Bibtex:
 ```
 @article{kiyohara2023towards,
   author = {Kiyohara, Haruka and Kishimoto, Ren and Kawakami, Kosuke and Kobayashi, Ken and Nakata, Kazuhide and Saito, Yuta},
   title = {Towards Assessing and Benchmarking Risk-Return Tradeoff of Off-Policy Evaluation},
-  journal={arXiv preprint arXiv:23xx.xxxxx},
+  journal={arXiv preprint arXiv:2311.18207},
   year={2023},
 }
 ```

diff --git a/basicgym/README.md b/basicgym/README.md
@@ -245,14 +245,13 @@ If you use our software in your work, please cite our paper:
 
 Haruka Kiyohara, Ren Kishimoto, Kosuke Kawakami, Ken Kobayashi, Kazuhide Nakata, Yuta Saito.<br>
 **SCOPE-RL: A Python Library for Offline Reinforcement Learning and Off-Policy Evaluation**<br>
-[link]() (a preprint coming soon..)
 
 Bibtex:
 ```
 @article{kiyohara2023scope,
   author = {Kiyohara, Haruka and Kishimoto, Ren and Kawakami, Kosuke and Kobayashi, Ken and Nakata, Kazuhide and Saito, Yuta},
   title = {SCOPE-RL: A Python Library for Offline Reinforcement Learning and Off-Policy Evaluation},
-  journal={arXiv preprint arXiv:23xx.xxxxx},
+  journal={arXiv preprint arXiv:2311.18206},
   year = {2023},
 }
 ```

diff --git a/basicgym/README_ja.md b/basicgym/README_ja.md
@@ -246,14 +246,13 @@ class CustomizedRewardFunction(BaseRewardFunction):
 
 Haruka Kiyohara, Ren Kishimoto, Kosuke Kawakami, Ken Kobayashi, Kazuhide Nakata, Yuta Saito.<br>
 **SCOPE-RL: A Python Library for Offline Reinforcement Learning and Off-Policy Evaluation**<br>
-[link]() (a preprint coming soon..)
 
 Bibtex:
 ```
 @article{kiyohara2023scope,
   author = {Kiyohara, Haruka and Kishimoto, Ren and Kawakami, Kosuke and Kobayashi, Ken and Nakata, Kazuhide and Saito, Yuta},
   title = {SCOPE-RL: A Python Library for Offline Reinforcement Learning and Off-Policy Evaluation},
-  journal={arXiv preprint arXiv:23xx.xxxxx},
+  journal={arXiv preprint arXiv:2311.18206},
   year = {2023},
 }
 ```

diff --git a/docs/conf.py b/docs/conf.py
@@ -81,7 +81,7 @@
     "icon_links": [
         {
             "name": "Speaker Deck",
-            "url": "https://speakerdeck.com/aiueola/ofrl-designing-an-offline-reinforcement-learning-and-policy-evaluation-platform-from-practical-perspectives",
+            "url": "https://speakerdeck.com/harukakiyohara_/scope-rl",
             "icon": "fa-brands fa-speaker-deck",
             "type": "fontawesome",
         },

diff --git a/docs/documentation/index.rst b/docs/documentation/index.rst
@@ -215,14 +215,13 @@ If you use our pipeline in your work, please cite our paper below.
 
     | Haruka Kiyohara, Ren Kishimoto, Kosuke Kawakami, Ken Kobayashi, Kazuhide Nakata, Yuta Saito.
     | **SCOPE-RL: A Python Library for Offline Reinforcement Learning and Off-Policy Evaluation**
-    | (a preprint is coming soon..)
 
     .. code-block::
 
         @article{kiyohara2023scope,
             title={SCOPE-RL: A Python Library for Offline Reinforcement Learning and Off-Policy Evaluation},
             author={Kiyohara, Haruka and Kishimoto, Ren and Kawakami, Kosuke and Kobayashi, Ken and Nakata, Kazuhide and Saito, Yuta},
-            journal={arXiv preprint arXiv:23xx.xxxxx},
+            journal={arXiv preprint arXiv:2311.18206},
             year={2023}
         }
 
@@ -239,7 +238,7 @@ If you use the proposed metric (SharpeRatio@k) or refer to our findings in your
         @article{kiyohara2023towards,
             title={Towards Assessing and Benchmarking Risk-Return Tradeoff of Off-Policy Evaluation},
             author={Kiyohara, Haruka and Kishimoto, Ren and Kawakami, Kosuke and Kobayashi, Ken and Nakata, Kazuhide and Saito, Yuta},
-            journal={arXiv preprint arXiv:23xx.xxxxx},
+            journal={arXiv preprint arXiv:2311.18207},
             year={2023}
         }
 

diff --git a/docs/documentation/installation.rst b/docs/documentation/installation.rst
@@ -40,7 +40,7 @@ If you use our pipeline in your work, please cite our paper below.
         @article{kiyohara2023scope,
             title={SCOPE-RL: A Python Library for Offline Reinforcement Learning and Off-Policy Evaluation},
             author={Kiyohara, Haruka and Kishimoto, Ren and Kawakami, Kosuke and Kobayashi, Ken and Nakata, Kazuhide and Saito, Yuta},
-            journal={arXiv preprint arXiv:23xx.xxxxx},
+            journal={arXiv preprint arXiv:2311.18206},
             year={2023}
         }
 
@@ -50,14 +50,13 @@ If you use the proposed metric (SharpeRatio@k) or refer to our findings in your
 
     | Haruka Kiyohara, Ren Kishimoto, Kosuke Kawakami, Ken Kobayashi, Kazuhide Nakata, Yuta Saito.
     | **Towards Assessing and Benchmarking Risk-Return Tradeoff of Off-Policy Evaluation**
-    | (a preprint is coming soon..)
 
     .. code-block::
 
         @article{kiyohara2023towards,
             title={Towards Assessing and Benchmarking Risk-Return Tradeoff of Off-Policy Evaluation},
             author={Kiyohara, Haruka and Kishimoto, Ren and Kawakami, Kosuke and Kobayashi, Ken and Nakata, Kazuhide and Saito, Yuta},
-            journal={arXiv preprint arXiv:23xx.xxxxx},
+            journal={arXiv preprint arXiv:2311.18207},
             year={2023}
         }
 

diff --git a/docs/documentation/news.rst b/docs/documentation/news.rst
@@ -6,8 +6,8 @@ Follow us on `Google Group ([email protected]) <https://groups.google.co
 2023
 ~~~~~~~~~~
 
-**2023.12.xx** Preprints of our papers: (1) [SCOPE-RL:  A Python Library for Offline Reinforcement Learning and Off-Policy Evaluation]() ([slides](), [日本語スライド]()), 
-and (2) [Towards Assessing and Benchmarking Risk-Return Tradeoff of Off-Policy Evaluation]() ([slides](), [日本語スライド]()) are now available at arXiv!
+**2023.12.01** Preprints of our twin papers: (1) `SCOPE-RL: A Python Library for Offline Reinforcement Learning and Off-Policy Evaluation <https://arxiv.org/abs/2311.18206>`_ (`slides <https://speakerdeck.com/harukakiyohara_/scope-rl>`_, `日本語スライド <https://speakerdeck.com/aiueola/scope-rl-ja>`_), 
+and (2) `Towards Assessing and Benchmarking Risk-Return Tradeoff of Off-Policy Evaluation <https://arxiv.org/abs/2311.18207>`_ (`slides <https://speakerdeck.com/harukakiyohara_/towards-risk-return-assessment-of-ope>`_, `日本語スライド <https://speakerdeck.com/aiueola/towards-risk-return-assessment-of-ope-ja>`_) are now available on arXiv!
 
 **2023.7.30** Released :class:`v0.2.1` of SCOPE-RL! This release upgrades the version of d3rlpy from `1.1.1` to `2.0.4`.
 

diff --git a/docs/documentation/sharpe_ratio.rst b/docs/documentation/sharpe_ratio.rst
@@ -312,14 +312,13 @@ If you use the proposed metric (SharpeRatio@k) or refer to our findings in your
 
     | Haruka Kiyohara, Ren Kishimoto, Kosuke Kawakami, Ken Kobayashi, Kazuhide Nakata, Yuta Saito.
     | **Towards Assessing and Benchmarking Risk-Return Tradeoff of Off-Policy Evaluation**
-    | (a preprint is coming soon..)
 
     .. code-block::
 
         @article{kiyohara2023towards,
             title={Towards Assessing and Benchmarking Risk-Return Tradeoff of Off-Policy Evaluation},
             author={Kiyohara, Haruka and Kishimoto, Ren and Kawakami, Kosuke and Kobayashi, Ken and Nakata, Kazuhide and Saito, Yuta},
-            journal={arXiv preprint arXiv:23xx.xxxxx},
+            journal={arXiv preprint arXiv:2311.18207},
             year={2023}
         }
 

diff --git a/docs/index.rst b/docs/index.rst
@@ -299,14 +299,13 @@ If you use our pipeline in your work, please cite our paper below.
 
     | Haruka Kiyohara, Ren Kishimoto, Kosuke Kawakami, Ken Kobayashi, Kazuhide Nakata, Yuta Saito.
     | **SCOPE-RL: A Python Library for Offline Reinforcement Learning and Off-Policy Evaluation**
-    | (a preprint is coming soon..)
 
     .. code-block::
 
         @article{kiyohara2023scope,
             title={SCOPE-RL: A Python Library for Offline Reinforcement Learning and Off-Policy Evaluation},
             author={Kiyohara, Haruka and Kishimoto, Ren and Kawakami, Kosuke and Kobayashi, Ken and Nakata, Kazuhide and Saito, Yuta},
-            journal={arXiv preprint arXiv:23xx.xxxxx},
+            journal={arXiv preprint arXiv:2311.18206},
             year={2023}
         }
 

diff --git a/recgym/README.md b/recgym/README.md
@@ -230,14 +230,13 @@ If you use our software in your work, please cite our paper:
 
 Haruka Kiyohara, Ren Kishimoto, Kosuke Kawakami, Ken Kobayashi, Kazuhide Nakata, Yuta Saito.<br>
 **SCOPE-RL: A Python Library for Offline Reinforcement Learning and Off-Policy Evaluation**<br>
-[link]() (a preprint coming soon..)
 
 Bibtex:
 ```
 @article{kiyohara2023scope,
   author = {Kiyohara, Haruka and Kishimoto, Ren and Kawakami, Kosuke and Kobayashi, Ken and Nakata, Kazuhide and Saito, Yuta},
   title = {SCOPE-RL: A Python Library for Offline Reinforcement Learning and Off-Policy Evaluation},
-  journal={arXiv preprint arXiv:23xx.xxxxx},
+  journal={arXiv preprint arXiv:2311.18206},
   year = {2023},
 }
 ```

diff --git a/recgym/README_ja.md b/recgym/README_ja.md
@@ -228,14 +228,13 @@ class CustomizedUserModel(BaseUserModel):
 
 Haruka Kiyohara, Ren Kishimoto, Kosuke Kawakami, Ken Kobayashi, Kazuhide Nakata, Yuta Saito.<br>
 **SCOPE-RL: A Python Library for Offline Reinforcement Learning and Off-Policy Evaluation**<br>
-[link]() (a preprint coming soon..)
 
 Bibtex:
 ```
 @article{kiyohara2023scope,
   author = {Kiyohara, Haruka and Kishimoto, Ren and Kawakami, Kosuke and Kobayashi, Ken and Nakata, Kazuhide and Saito, Yuta},
   title = {SCOPE-RL: A Python Library for Offline Reinforcement Learning and Off-Policy Evaluation},
-  journal={arXiv preprint arXiv:23xx.xxxxx},
+  journal={arXiv preprint arXiv:2311.18206},
   year = {2023},
 }
 ```

diff --git a/rtbgym/README.md b/rtbgym/README.md
@@ -363,14 +363,13 @@ If you use our software in your work, please cite our paper:
 
 Haruka Kiyohara, Ren Kishimoto, Kosuke Kawakami, Ken Kobayashi, Kazuhide Nakata, Yuta Saito.<br>
 **SCOPE-RL: A Python Library for Offline Reinforcement Learning and Off-Policy Evaluation**<br>
-[link]() (a preprint coming soon..)
 
 Bibtex:
 ```
 @article{kiyohara2023scope,
   author = {Kiyohara, Haruka and Kishimoto, Ren and Kawakami, Kosuke and Kobayashi, Ken and Nakata, Kazuhide and Saito, Yuta},
   title = {SCOPE-RL: A Python Library for Offline Reinforcement Learning and Off-Policy Evaluation},
-  journal={arXiv preprint arXiv:23xx.xxxxx},
+  journal={arXiv preprint arXiv:2311.18206},
   year = {2023},
 }
 ```

diff --git a/rtbgym/README_ja.md b/rtbgym/README_ja.md
@@ -359,16 +359,16 @@ custom_env = CustomizedRTBEnv(
 ## 引用
 
 ソフトウェアを使用する場合は，以下の論文の引用をお願いします．
+
 Haruka Kiyohara, Ren Kishimoto, Kosuke Kawakami, Ken Kobayashi, Kazuhide Nakata, Yuta Saito.<br>
 **SCOPE-RL: A Python Library for Offline Reinforcement Learning and Off-Policy Evaluation**<br>
-[link]() (a preprint coming soon..)
 
 Bibtex:
 ```
 @article{kiyohara2023scope,
   author = {Kiyohara, Haruka and Kishimoto, Ren and Kawakami, Kosuke and Kobayashi, Ken and Nakata, Kazuhide and Saito, Yuta},
   title = {SCOPE-RL: A Python Library for Offline Reinforcement Learning and Off-Policy Evaluation},
-  journal={arXiv preprint arXiv:23xx.xxxxx},
+  journal={arXiv preprint arXiv:2311.18206},
   year = {2023},
 }
 ```