From 857a087a2afc6a16d50b93370b1c56ff24335951 Mon Sep 17 00:00:00 2001 From: Antonin RAFFIN Date: Tue, 8 Dec 2020 15:35:50 +0100 Subject: [PATCH] Update TQC to match SB3 (#14) --- docs/misc/changelog.rst | 3 ++- sb3_contrib/tqc/tqc.py | 2 ++ sb3_contrib/version.txt | 2 +- 3 files changed, 5 insertions(+), 2 deletions(-) diff --git a/docs/misc/changelog.rst b/docs/misc/changelog.rst index 5302fa0..0f0cc13 100644 --- a/docs/misc/changelog.rst +++ b/docs/misc/changelog.rst @@ -4,7 +4,7 @@ Changelog ========== -Pre-Release 0.11.0a0 (WIP) +Pre-Release 0.11.0a2 (WIP) ------------------------------- Breaking Changes: @@ -22,6 +22,7 @@ Deprecations: Others: ^^^^^^^ +- Updated ``TQC`` to match new SB3 version Documentation: ^^^^^^^^^^^^^^ diff --git a/sb3_contrib/tqc/tqc.py b/sb3_contrib/tqc/tqc.py index d8fd647..5ef9f10 100644 --- a/sb3_contrib/tqc/tqc.py +++ b/sb3_contrib/tqc/tqc.py @@ -1,5 +1,6 @@ from typing import Any, Callable, Dict, List, Optional, Tuple, Type, Union +import gym import numpy as np import torch as th from stable_baselines3.common import logger @@ -114,6 +115,7 @@ class TQC(OffPolicyAlgorithm): sde_sample_freq=sde_sample_freq, use_sde_at_warmup=use_sde_at_warmup, optimize_memory_usage=optimize_memory_usage, + supported_action_spaces=(gym.spaces.Box), ) self.target_entropy = target_entropy diff --git a/sb3_contrib/version.txt b/sb3_contrib/version.txt index d22e31d..a09c7eb 100644 --- a/sb3_contrib/version.txt +++ b/sb3_contrib/version.txt @@ -1 +1 @@ -0.11.0a0 +0.11.0a2