Prepare Release v2.0 (#192)
This commit is contained in:
parent
6e1aba45e3
commit
de92025bb2
|
|
@ -3,7 +3,7 @@
|
||||||
Changelog
|
Changelog
|
||||||
==========
|
==========
|
||||||
|
|
||||||
Release 2.0.0a13 (WIP)
|
Release 2.0.0 (2023-06-22)
|
||||||
--------------------------
|
--------------------------
|
||||||
|
|
||||||
**Gymnasium support**
|
**Gymnasium support**
|
||||||
|
|
|
||||||
|
|
@ -4,8 +4,13 @@ line-length = 127
|
||||||
# Assume Python 3.7
|
# Assume Python 3.7
|
||||||
target-version = "py37"
|
target-version = "py37"
|
||||||
select = ["E", "F", "B", "UP", "C90", "RUF"]
|
select = ["E", "F", "B", "UP", "C90", "RUF"]
|
||||||
# Ignore explicit stacklevel`
|
# B028: Ignore explicit stacklevel
|
||||||
ignore = ["B028"]
|
# RUF013: Too many false positives (implicit optional)
|
||||||
|
ignore = ["B028", "RUF013"]
|
||||||
|
|
||||||
|
[tool.ruff.per-file-ignores]
|
||||||
|
# ClassVar, implicit optional check not needed for tests
|
||||||
|
"./tests/*.py"= ["RUF012", "RUF013"]
|
||||||
|
|
||||||
[tool.ruff.mccabe]
|
[tool.ruff.mccabe]
|
||||||
# Unlike Flake8, ruff defaults to a complexity level of 10.
|
# Unlike Flake8, ruff defaults to a complexity level of 10.
|
||||||
|
|
|
||||||
|
|
@ -3,7 +3,7 @@ import sys
|
||||||
import time
|
import time
|
||||||
import warnings
|
import warnings
|
||||||
from functools import partial
|
from functools import partial
|
||||||
from typing import Any, Dict, Optional, Type, TypeVar, Union
|
from typing import Any, ClassVar, Dict, Optional, Type, TypeVar, Union
|
||||||
|
|
||||||
import numpy as np
|
import numpy as np
|
||||||
import torch as th
|
import torch as th
|
||||||
|
|
@ -50,7 +50,7 @@ class ARS(BaseAlgorithm):
|
||||||
:param _init_setup_model: Whether or not to build the network at the creation of the instance
|
:param _init_setup_model: Whether or not to build the network at the creation of the instance
|
||||||
"""
|
"""
|
||||||
|
|
||||||
policy_aliases: Dict[str, Type[BasePolicy]] = {
|
policy_aliases: ClassVar[Dict[str, Type[BasePolicy]]] = {
|
||||||
"MlpPolicy": MlpPolicy,
|
"MlpPolicy": MlpPolicy,
|
||||||
"LinearPolicy": LinearPolicy,
|
"LinearPolicy": LinearPolicy,
|
||||||
}
|
}
|
||||||
|
|
|
||||||
|
|
@ -1,7 +1,7 @@
|
||||||
import sys
|
import sys
|
||||||
import time
|
import time
|
||||||
from collections import deque
|
from collections import deque
|
||||||
from typing import Any, Dict, Optional, Tuple, Type, TypeVar, Union
|
from typing import Any, ClassVar, Dict, Optional, Tuple, Type, TypeVar, Union
|
||||||
|
|
||||||
import numpy as np
|
import numpy as np
|
||||||
import torch as th
|
import torch as th
|
||||||
|
|
@ -69,7 +69,7 @@ class MaskablePPO(OnPolicyAlgorithm):
|
||||||
:param _init_setup_model: Whether or not to build the network at the creation of the instance
|
:param _init_setup_model: Whether or not to build the network at the creation of the instance
|
||||||
"""
|
"""
|
||||||
|
|
||||||
policy_aliases: Dict[str, Type[BasePolicy]] = {
|
policy_aliases: ClassVar[Dict[str, Type[BasePolicy]]] = {
|
||||||
"MlpPolicy": MlpPolicy,
|
"MlpPolicy": MlpPolicy,
|
||||||
"CnnPolicy": CnnPolicy,
|
"CnnPolicy": CnnPolicy,
|
||||||
"MultiInputPolicy": MultiInputPolicy,
|
"MultiInputPolicy": MultiInputPolicy,
|
||||||
|
|
|
||||||
|
|
@ -1,7 +1,7 @@
|
||||||
import sys
|
import sys
|
||||||
import time
|
import time
|
||||||
from copy import deepcopy
|
from copy import deepcopy
|
||||||
from typing import Any, Dict, Optional, Type, TypeVar, Union
|
from typing import Any, ClassVar, Dict, Optional, Type, TypeVar, Union
|
||||||
|
|
||||||
import numpy as np
|
import numpy as np
|
||||||
import torch as th
|
import torch as th
|
||||||
|
|
@ -67,7 +67,7 @@ class RecurrentPPO(OnPolicyAlgorithm):
|
||||||
:param _init_setup_model: Whether or not to build the network at the creation of the instance
|
:param _init_setup_model: Whether or not to build the network at the creation of the instance
|
||||||
"""
|
"""
|
||||||
|
|
||||||
policy_aliases: Dict[str, Type[BasePolicy]] = {
|
policy_aliases: ClassVar[Dict[str, Type[BasePolicy]]] = {
|
||||||
"MlpLstmPolicy": MlpLstmPolicy,
|
"MlpLstmPolicy": MlpLstmPolicy,
|
||||||
"CnnLstmPolicy": CnnLstmPolicy,
|
"CnnLstmPolicy": CnnLstmPolicy,
|
||||||
"MultiInputLstmPolicy": MultiInputLstmPolicy,
|
"MultiInputLstmPolicy": MultiInputLstmPolicy,
|
||||||
|
|
|
||||||
|
|
@ -1,5 +1,5 @@
|
||||||
import warnings
|
import warnings
|
||||||
from typing import Any, Dict, List, Optional, Tuple, Type, TypeVar, Union
|
from typing import Any, ClassVar, Dict, List, Optional, Tuple, Type, TypeVar, Union
|
||||||
|
|
||||||
import numpy as np
|
import numpy as np
|
||||||
import torch as th
|
import torch as th
|
||||||
|
|
@ -60,7 +60,7 @@ class QRDQN(OffPolicyAlgorithm):
|
||||||
:param _init_setup_model: Whether or not to build the network at the creation of the instance
|
:param _init_setup_model: Whether or not to build the network at the creation of the instance
|
||||||
"""
|
"""
|
||||||
|
|
||||||
policy_aliases: Dict[str, Type[BasePolicy]] = {
|
policy_aliases: ClassVar[Dict[str, Type[BasePolicy]]] = {
|
||||||
"MlpPolicy": MlpPolicy,
|
"MlpPolicy": MlpPolicy,
|
||||||
"CnnPolicy": CnnPolicy,
|
"CnnPolicy": CnnPolicy,
|
||||||
"MultiInputPolicy": MultiInputPolicy,
|
"MultiInputPolicy": MultiInputPolicy,
|
||||||
|
|
|
||||||
|
|
@ -1,4 +1,4 @@
|
||||||
from typing import Any, Callable, Dict, List, Optional, Tuple, Type, TypeVar, Union
|
from typing import Any, Callable, ClassVar, Dict, List, Optional, Tuple, Type, TypeVar, Union
|
||||||
|
|
||||||
import numpy as np
|
import numpy as np
|
||||||
import torch as th
|
import torch as th
|
||||||
|
|
@ -68,7 +68,7 @@ class TQC(OffPolicyAlgorithm):
|
||||||
:param _init_setup_model: Whether or not to build the network at the creation of the instance
|
:param _init_setup_model: Whether or not to build the network at the creation of the instance
|
||||||
"""
|
"""
|
||||||
|
|
||||||
policy_aliases: Dict[str, Type[BasePolicy]] = {
|
policy_aliases: ClassVar[Dict[str, Type[BasePolicy]]] = {
|
||||||
"MlpPolicy": MlpPolicy,
|
"MlpPolicy": MlpPolicy,
|
||||||
"CnnPolicy": CnnPolicy,
|
"CnnPolicy": CnnPolicy,
|
||||||
"MultiInputPolicy": MultiInputPolicy,
|
"MultiInputPolicy": MultiInputPolicy,
|
||||||
|
|
|
||||||
|
|
@ -1,7 +1,7 @@
|
||||||
import copy
|
import copy
|
||||||
import warnings
|
import warnings
|
||||||
from functools import partial
|
from functools import partial
|
||||||
from typing import Any, Dict, List, Optional, Tuple, Type, TypeVar, Union
|
from typing import Any, ClassVar, Dict, List, Optional, Tuple, Type, TypeVar, Union
|
||||||
|
|
||||||
import numpy as np
|
import numpy as np
|
||||||
import torch as th
|
import torch as th
|
||||||
|
|
@ -69,7 +69,7 @@ class TRPO(OnPolicyAlgorithm):
|
||||||
:param _init_setup_model: Whether or not to build the network at the creation of the instance
|
:param _init_setup_model: Whether or not to build the network at the creation of the instance
|
||||||
"""
|
"""
|
||||||
|
|
||||||
policy_aliases: Dict[str, Type[BasePolicy]] = {
|
policy_aliases: ClassVar[Dict[str, Type[BasePolicy]]] = {
|
||||||
"MlpPolicy": MlpPolicy,
|
"MlpPolicy": MlpPolicy,
|
||||||
"CnnPolicy": CnnPolicy,
|
"CnnPolicy": CnnPolicy,
|
||||||
"MultiInputPolicy": MultiInputPolicy,
|
"MultiInputPolicy": MultiInputPolicy,
|
||||||
|
|
|
||||||
|
|
@ -1 +1 @@
|
||||||
2.0.0a13
|
2.0.0
|
||||||
|
|
|
||||||
4
setup.py
4
setup.py
|
|
@ -65,7 +65,7 @@ setup(
|
||||||
packages=[package for package in find_packages() if package.startswith("sb3_contrib")],
|
packages=[package for package in find_packages() if package.startswith("sb3_contrib")],
|
||||||
package_data={"sb3_contrib": ["py.typed", "version.txt"]},
|
package_data={"sb3_contrib": ["py.typed", "version.txt"]},
|
||||||
install_requires=[
|
install_requires=[
|
||||||
"stable_baselines3>=2.0.0a13",
|
"stable_baselines3>=2.0.0",
|
||||||
],
|
],
|
||||||
description="Contrib package of Stable Baselines3, experimental code.",
|
description="Contrib package of Stable Baselines3, experimental code.",
|
||||||
author="Antonin Raffin",
|
author="Antonin Raffin",
|
||||||
|
|
@ -82,8 +82,10 @@ setup(
|
||||||
project_urls={
|
project_urls={
|
||||||
"Code": "https://github.com/Stable-Baselines-Team/stable-baselines3-contrib",
|
"Code": "https://github.com/Stable-Baselines-Team/stable-baselines3-contrib",
|
||||||
"Documentation": "https://sb3-contrib.readthedocs.io/",
|
"Documentation": "https://sb3-contrib.readthedocs.io/",
|
||||||
|
"Changelog": "https://stable-baselines3.readthedocs.io/en/master/misc/changelog.html",
|
||||||
"Stable-Baselines3": "https://github.com/DLR-RM/stable-baselines3",
|
"Stable-Baselines3": "https://github.com/DLR-RM/stable-baselines3",
|
||||||
"RL-Zoo": "https://github.com/DLR-RM/rl-baselines3-zoo",
|
"RL-Zoo": "https://github.com/DLR-RM/rl-baselines3-zoo",
|
||||||
|
"SBX": "https://github.com/araffin/sbx",
|
||||||
},
|
},
|
||||||
classifiers=[
|
classifiers=[
|
||||||
"Programming Language :: Python :: 3",
|
"Programming Language :: Python :: 3",
|
||||||
|
|
|
||||||
Loading…
Reference in New Issue