From 600b8d47299a0c69bf1d09c1172c7735bb7e5d5d Mon Sep 17 00:00:00 2001 From: Rohan Potdar <66227218+Rohan138@users.noreply.github.com> Date: Thu, 11 Aug 2022 12:44:22 +0530 Subject: [PATCH] [RLlib]: Fix OPE docs. (#27460) --- doc/source/rllib/rllib-offline.rst | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/doc/source/rllib/rllib-offline.rst b/doc/source/rllib/rllib-offline.rst index 78aea01c2dd76..8c2ea44a59037 100644 --- a/doc/source/rllib/rllib-offline.rst +++ b/doc/source/rllib/rllib-offline.rst @@ -124,11 +124,11 @@ We can now train a DQN algorithm offline and evaluate it using OPE: "wis": {"type": WeightedImportanceSampling}, "dm_fqe": { "type": DirectMethod, - "q_model_config": {"type": FQETorchModel, "tau": 0.05}, + "q_model_config": {"type": FQETorchModel, "polyak_coef": 0.05}, }, "dr_fqe": { "type": DoublyRobust, - "q_model_config": {"type": FQETorchModel, "tau": 0.05}, + "q_model_config": {"type": FQETorchModel, "polyak_coef": 0.05}, }, }, )