Gymnasium/tests/wrappers/test_numpy_to_torch.py

"""Test suite for NumPyToTorch wrapper."""

import numpy as np
import pytest


torch = pytest.importorskip("torch")


from gymnasium.utils.env_checker import data_equivalence  # noqa: E402
from gymnasium.wrappers.numpy_to_torch import (  # noqa: E402
    NumpyToTorch,
    numpy_to_torch,
    torch_to_numpy,
)
from tests.testing_env import GenericTestEnv  # noqa: E402


@pytest.mark.parametrize(
    "value, expected_value",
    [
        # Bare Python scalars: expected back as 0-d float32 / int64 arrays.
        (1.0, np.array(1.0, dtype=np.float32)),
        (2, np.array(2, dtype=np.int64)),
        # Flat containers of scalars keep their container type.
        ((3.0, 4), (np.array(3.0, dtype=np.float32), np.array(4, dtype=np.int64))),
        ([3.0, 4], [np.array(3.0, dtype=np.float32), np.array(4, dtype=np.int64)]),
        (
            {"a": 6.0, "b": 7},
            {"a": np.array(6.0, dtype=np.float32), "b": np.array(7, dtype=np.int64)},
        ),
        # Numpy arrays are expected back with the same dtype and shape.
        (np.array(1.0, dtype=np.float32), np.array(1.0, dtype=np.float32)),
        (np.array(1.0, dtype=np.uint8), np.array(1.0, dtype=np.uint8)),
        (np.array([1, 2], dtype=np.int32), np.array([1, 2], dtype=np.int32)),
        (
            np.array([[1.0], [2.0]], dtype=np.int32),
            np.array([[1.0], [2.0]], dtype=np.int32),
        ),
        # Nested mix of dicts, tuples, scalars and arrays.
        (
            {
                "a": (
                    1,
                    np.array(2.0, dtype=np.float32),
                    np.array([3, 4], dtype=np.int32),
                ),
                "b": {"c": 5},
            },
            {
                "a": (
                    np.array(1, dtype=np.int64),
                    np.array(2.0, dtype=np.float32),
                    np.array([3, 4], dtype=np.int32),
                ),
                "b": {"c": np.array(5, dtype=np.int64)},
            },
        ),
    ],
)
def test_roundtripping(value, expected_value):
    """Check that a numpy -> torch -> numpy roundtrip yields the expected value.

    The conversion is tested in this order because it is the direction used
    by the ``NumpyToTorch`` wrapper.

    Args:
        value: The input passed to ``numpy_to_torch``.
        expected_value: What ``torch_to_numpy`` should return for the
            converted input, compared using ``data_equivalence``.
    """
    back_in_numpy = torch_to_numpy(numpy_to_torch(value))
    assert data_equivalence(back_in_numpy, expected_value)


def numpy_reset_func(self, seed=None, options=None):
    """Reset function returning fixed numpy data.

    Args:
        self: The environment instance (unused).
        seed: Accepted for signature compatibility; ignored.
        options: Accepted for signature compatibility; ignored.

    Returns:
        A ``(observation, info)`` tuple where the observation is a float numpy
        array and ``info["data"]`` is an integer numpy array.
    """
    observation = np.array([1.0, 2.0, 3.0])
    info = {"data": np.array([1, 2, 3])}
    return observation, info


def numpy_step_func(self, action):
    """Step function returning fixed numpy data.

    Args:
        self: The environment instance (unused).
        action: The action to apply; must be a ``np.ndarray``.

    Returns:
        A five-element tuple of an integer numpy observation, the float
        ``5.0``, ``True``, ``False`` and a dict whose ``"data"`` entry is a
        float numpy array.

    Raises:
        AssertionError: If ``action`` is not a ``np.ndarray``; the offending
            type is used as the assertion message.
    """
    # Fail loudly (reporting the actual type) if the action was not converted
    # to numpy before reaching this function.
    assert isinstance(action, np.ndarray), type(action)

    observation = np.array([1, 2, 3])
    reward = 5.0
    terminated = True
    truncated = False
    info = {"data": np.array([1.0, 2.0])}
    return observation, reward, terminated, truncated, info


def test_numpy_to_torch():
    """Tests the ``NumpyToTorch`` wrapper.

    The unwrapped environment is exercised first to confirm that it produces
    numpy data, then the wrapped environment is checked to return
    ``torch.Tensor`` data for the observation and ``info["data"]`` while the
    reward stays a ``float`` and the termination flags stay ``bool``.
    """
    base_env = GenericTestEnv(reset_func=numpy_reset_func, step_func=numpy_step_func)

    def check_reset_and_step(env, action, array_type):
        """Reset and step ``env`` once, asserting the type of every output."""
        obs, info = env.reset()
        assert isinstance(obs, array_type)
        assert isinstance(info, dict) and isinstance(info["data"], array_type)

        obs, reward, terminated, truncated, info = env.step(action)
        assert isinstance(obs, array_type)
        assert isinstance(reward, float)
        assert isinstance(terminated, bool) and isinstance(truncated, bool)
        assert isinstance(info, dict) and isinstance(info["data"], array_type)

    # Baseline: the unwrapped environment works with numpy arrays throughout.
    check_reset_and_step(base_env, np.array([1, 2]), np.ndarray)

    # Check that the wrapped version accepts a torch action and returns torch data.
    check_reset_and_step(NumpyToTorch(base_env), torch.tensor([1, 2]), torch.Tensor)
Merge v1.0.0 (#682) Co-authored-by: Kallinteris Andreas <30759571+Kallinteris-Andreas@users.noreply.github.com> Co-authored-by: Jet <38184875+jjshoots@users.noreply.github.com> Co-authored-by: Omar Younis <42100908+younik@users.noreply.github.com> 2023-11-07 13:27:25 +00:00			`"""Test suite for NumPyToTorch wrapper."""`
Add wrappers to experimental (#201) 2022-12-10 22:04:14 +00:00
Adds wrappers for jax environments converting to numpy and pytorch (#168) Co-authored-by: Justin Deutsch <djustin8@vt.edu> Co-authored-by: Gianluca De Cola <42657588+gianlucadecola@users.noreply.github.com> 2022-12-03 19:46:01 +00:00			`import numpy as np`
			`import pytest`

Skip Jax and PyTorch tests if module is missing (#466) 2023-04-25 03:47:51 -07:00
Merge v1.0.0 (#682) Co-authored-by: Kallinteris Andreas <30759571+Kallinteris-Andreas@users.noreply.github.com> Co-authored-by: Jet <38184875+jjshoots@users.noreply.github.com> Co-authored-by: Omar Younis <42100908+younik@users.noreply.github.com> 2023-11-07 13:27:25 +00:00			`torch = pytest.importorskip("torch")`

Skip Jax and PyTorch tests if module is missing (#466) 2023-04-25 03:47:51 -07:00
			`from gymnasium.utils.env_checker import data_equivalence # noqa: E402`
Merge v1.0.0 (#682) Co-authored-by: Kallinteris Andreas <30759571+Kallinteris-Andreas@users.noreply.github.com> Co-authored-by: Jet <38184875+jjshoots@users.noreply.github.com> Co-authored-by: Omar Younis <42100908+younik@users.noreply.github.com> 2023-11-07 13:27:25 +00:00			`from gymnasium.wrappers.numpy_to_torch import ( # noqa: E402`
			`NumpyToTorch,`
			`numpy_to_torch,`
			`torch_to_numpy,`
			`)`
Skip Jax and PyTorch tests if module is missing (#466) 2023-04-25 03:47:51 -07:00			`from tests.testing_env import GenericTestEnv # noqa: E402`
Adds wrappers for jax environments converting to numpy and pytorch (#168) Co-authored-by: Justin Deutsch <djustin8@vt.edu> Co-authored-by: Gianluca De Cola <42657588+gianlucadecola@users.noreply.github.com> 2022-12-03 19:46:01 +00:00

			`@pytest.mark.parametrize(`
			`"value, expected_value",`
			`[`
Add dtype testing for `data_equivalence` and update testing (#515) 2023-05-23 17:03:25 +01:00			`(1.0, np.array(1.0, dtype=np.float32)),`
Merge v1.0.0 (#682) Co-authored-by: Kallinteris Andreas <30759571+Kallinteris-Andreas@users.noreply.github.com> Co-authored-by: Jet <38184875+jjshoots@users.noreply.github.com> Co-authored-by: Omar Younis <42100908+younik@users.noreply.github.com> 2023-11-07 13:27:25 +00:00			`(2, np.array(2, dtype=np.int64)),`
			`((3.0, 4), (np.array(3.0, dtype=np.float32), np.array(4, dtype=np.int64))),`
			`([3.0, 4], [np.array(3.0, dtype=np.float32), np.array(4, dtype=np.int64)]),`
Adds wrappers for jax environments converting to numpy and pytorch (#168) Co-authored-by: Justin Deutsch <djustin8@vt.edu> Co-authored-by: Gianluca De Cola <42657588+gianlucadecola@users.noreply.github.com> 2022-12-03 19:46:01 +00:00			`(`
			`{`
			`"a": 6.0,`
			`"b": 7,`
			`},`
Merge v1.0.0 (#682) Co-authored-by: Kallinteris Andreas <30759571+Kallinteris-Andreas@users.noreply.github.com> Co-authored-by: Jet <38184875+jjshoots@users.noreply.github.com> Co-authored-by: Omar Younis <42100908+younik@users.noreply.github.com> 2023-11-07 13:27:25 +00:00			`{"a": np.array(6.0, dtype=np.float32), "b": np.array(7, dtype=np.int64)},`
Add dtype testing for `data_equivalence` and update testing (#515) 2023-05-23 17:03:25 +01:00			`),`
			`(np.array(1.0, dtype=np.float32), np.array(1.0, dtype=np.float32)),`
			`(np.array(1.0, dtype=np.uint8), np.array(1.0, dtype=np.uint8)),`
			`(np.array([1, 2], dtype=np.int32), np.array([1, 2], dtype=np.int32)),`
			`(`
			`np.array([[1.0], [2.0]], dtype=np.int32),`
			`np.array([[1.0], [2.0]], dtype=np.int32),`
Adds wrappers for jax environments converting to numpy and pytorch (#168) Co-authored-by: Justin Deutsch <djustin8@vt.edu> Co-authored-by: Gianluca De Cola <42657588+gianlucadecola@users.noreply.github.com> 2022-12-03 19:46:01 +00:00			`),`
			`(`
			`{`
Add dtype testing for `data_equivalence` and update testing (#515) 2023-05-23 17:03:25 +01:00			`"a": (`
			`1,`
			`np.array(2.0, dtype=np.float32),`
			`np.array([3, 4], dtype=np.int32),`
			`),`
			`"b": {"c": 5},`
			`},`
			`{`
			`"a": (`
Merge v1.0.0 (#682) Co-authored-by: Kallinteris Andreas <30759571+Kallinteris-Andreas@users.noreply.github.com> Co-authored-by: Jet <38184875+jjshoots@users.noreply.github.com> Co-authored-by: Omar Younis <42100908+younik@users.noreply.github.com> 2023-11-07 13:27:25 +00:00			`np.array(1, dtype=np.int64),`
Add dtype testing for `data_equivalence` and update testing (#515) 2023-05-23 17:03:25 +01:00			`np.array(2.0, dtype=np.float32),`
			`np.array([3, 4], dtype=np.int32),`
			`),`
Merge v1.0.0 (#682) Co-authored-by: Kallinteris Andreas <30759571+Kallinteris-Andreas@users.noreply.github.com> Co-authored-by: Jet <38184875+jjshoots@users.noreply.github.com> Co-authored-by: Omar Younis <42100908+younik@users.noreply.github.com> 2023-11-07 13:27:25 +00:00			`"b": {"c": np.array(5, dtype=np.int64)},`
Adds wrappers for jax environments converting to numpy and pytorch (#168) Co-authored-by: Justin Deutsch <djustin8@vt.edu> Co-authored-by: Gianluca De Cola <42657588+gianlucadecola@users.noreply.github.com> 2022-12-03 19:46:01 +00:00			`},`
			`),`
			`],`
			`)`
			`def test_roundtripping(value, expected_value):`
Merge v1.0.0 (#682) Co-authored-by: Kallinteris Andreas <30759571+Kallinteris-Andreas@users.noreply.github.com> Co-authored-by: Jet <38184875+jjshoots@users.noreply.github.com> Co-authored-by: Omar Younis <42100908+younik@users.noreply.github.com> 2023-11-07 13:27:25 +00:00			`"""We test numpy -> torch -> numpy as this is direction in the NumpyToTorch wrapper."""`
			`torch_value = numpy_to_torch(value)`
			`roundtripped_value = torch_to_numpy(torch_value)`
			`# roundtripped_value = torch_to_numpy(numpy_to_torch(value))`
Add dtype testing for `data_equivalence` and update testing (#515) 2023-05-23 17:03:25 +01:00			`assert data_equivalence(roundtripped_value, expected_value)`
Adds wrappers for jax environments converting to numpy and pytorch (#168) Co-authored-by: Justin Deutsch <djustin8@vt.edu> Co-authored-by: Gianluca De Cola <42657588+gianlucadecola@users.noreply.github.com> 2022-12-03 19:46:01 +00:00

Merge v1.0.0 (#682) Co-authored-by: Kallinteris Andreas <30759571+Kallinteris-Andreas@users.noreply.github.com> Co-authored-by: Jet <38184875+jjshoots@users.noreply.github.com> Co-authored-by: Omar Younis <42100908+younik@users.noreply.github.com> 2023-11-07 13:27:25 +00:00			`def numpy_reset_func(self, seed=None, options=None):`
			`"""A Numpy-based reset function."""`
			`return np.array([1.0, 2.0, 3.0]), {"data": np.array([1, 2, 3])}`
Adds wrappers for jax environments converting to numpy and pytorch (#168) Co-authored-by: Justin Deutsch <djustin8@vt.edu> Co-authored-by: Gianluca De Cola <42657588+gianlucadecola@users.noreply.github.com> 2022-12-03 19:46:01 +00:00

Merge v1.0.0 (#682) Co-authored-by: Kallinteris Andreas <30759571+Kallinteris-Andreas@users.noreply.github.com> Co-authored-by: Jet <38184875+jjshoots@users.noreply.github.com> Co-authored-by: Omar Younis <42100908+younik@users.noreply.github.com> 2023-11-07 13:27:25 +00:00			`def numpy_step_func(self, action):`
			`"""A Numpy-based step function."""`
			`assert isinstance(action, np.ndarray), type(action)`
Adds wrappers for jax environments converting to numpy and pytorch (#168) Co-authored-by: Justin Deutsch <djustin8@vt.edu> Co-authored-by: Gianluca De Cola <42657588+gianlucadecola@users.noreply.github.com> 2022-12-03 19:46:01 +00:00			`return (`
Merge v1.0.0 (#682) Co-authored-by: Kallinteris Andreas <30759571+Kallinteris-Andreas@users.noreply.github.com> Co-authored-by: Jet <38184875+jjshoots@users.noreply.github.com> Co-authored-by: Omar Younis <42100908+younik@users.noreply.github.com> 2023-11-07 13:27:25 +00:00			`np.array([1, 2, 3]),`
			`5.0,`
			`True,`
			`False,`
			`{"data": np.array([1.0, 2.0])},`
Adds wrappers for jax environments converting to numpy and pytorch (#168) Co-authored-by: Justin Deutsch <djustin8@vt.edu> Co-authored-by: Gianluca De Cola <42657588+gianlucadecola@users.noreply.github.com> 2022-12-03 19:46:01 +00:00			`)`


Merge v1.0.0 (#682) Co-authored-by: Kallinteris Andreas <30759571+Kallinteris-Andreas@users.noreply.github.com> Co-authored-by: Jet <38184875+jjshoots@users.noreply.github.com> Co-authored-by: Omar Younis <42100908+younik@users.noreply.github.com> 2023-11-07 13:27:25 +00:00			`def test_numpy_to_torch():`
			"""Tests the ``TorchToNumpy`` wrapper."""
			`numpy_env = GenericTestEnv(reset_func=numpy_reset_func, step_func=numpy_step_func)`
Adds wrappers for jax environments converting to numpy and pytorch (#168) Co-authored-by: Justin Deutsch <djustin8@vt.edu> Co-authored-by: Gianluca De Cola <42657588+gianlucadecola@users.noreply.github.com> 2022-12-03 19:46:01 +00:00			`obs, info = numpy_env.reset()`
			`assert isinstance(obs, np.ndarray)`
			`assert isinstance(info, dict) and isinstance(info["data"], np.ndarray)`

			`obs, reward, terminated, truncated, info = numpy_env.step(np.array([1, 2]))`
			`assert isinstance(obs, np.ndarray)`
			`assert isinstance(reward, float)`
			`assert isinstance(terminated, bool) and isinstance(truncated, bool)`
			`assert isinstance(info, dict) and isinstance(info["data"], np.ndarray)`
Merge v1.0.0 (#682) Co-authored-by: Kallinteris Andreas <30759571+Kallinteris-Andreas@users.noreply.github.com> Co-authored-by: Jet <38184875+jjshoots@users.noreply.github.com> Co-authored-by: Omar Younis <42100908+younik@users.noreply.github.com> 2023-11-07 13:27:25 +00:00
			`# Check that the wrapped version is correct.`
			`torch_env = NumpyToTorch(numpy_env)`

			`# Check that the reset and step for torch environment are as expected`
			`obs, info = torch_env.reset()`
			`assert isinstance(obs, torch.Tensor)`
			`assert isinstance(info, dict) and isinstance(info["data"], torch.Tensor)`

			`obs, reward, terminated, truncated, info = torch_env.step(torch.tensor([1, 2]))`
			`assert isinstance(obs, torch.Tensor)`
			`assert isinstance(reward, float)`
			`assert isinstance(terminated, bool) and isinstance(truncated, bool)`
			`assert isinstance(info, dict) and isinstance(info["data"], torch.Tensor)`