diff --git a/algorithms/offline/cql.py b/algorithms/offline/cql.py index 3b49a05e..099bce29 100644 --- a/algorithms/offline/cql.py +++ b/algorithms/offline/cql.py @@ -54,8 +54,6 @@ class TrainConfig: normalize: bool = True # Normalize states normalize_reward: bool = False # Normalize reward q_n_hidden_layers: int = 3 # Number of hidden layers in Q networks - reward_scale: float = 1.0 # Reward scale for normalization - reward_bias: float = 0.0 # Reward bias for normalization bc_steps: int = int(0) # Number of BC steps at start reward_scale: float = 5.0 # Reward scale for normalization reward_bias: float = -1.0 # Reward bias for normalization