"""Test suite for TorchToJax wrapper."""
from typing import NamedTuple
import numpy as np
import pytest
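# Skip the whole module at collection time if jax or torch is unavailable;
# everything below can then assume both packages import successfully.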
jax = pytest.importorskip("jax")
jnp = pytest.importorskip("jax.numpy")
torch = pytest.importorskip("torch")
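# These imports must come after the importorskip guards above, hence the
# "# noqa: E402" (module-level import not at top of file) suppressions.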
from gymnasium.wrappers.jax_to_torch import (  # noqa: E402
    JaxToTorch,
    jax_to_torch,
    torch_to_jax,
)
from tests.testing_env import GenericTestEnv  # noqa: E402


def torch_data_equivalence(data_1, data_2) -> bool:
    """Return whether two (possibly nested) structures that might contain ``torch.Tensor`` are equivalent."""
    if type(data_1) is type(data_2):
        if isinstance(data_1, dict):
            return data_1.keys() == data_2.keys() and all(
                torch_data_equivalence(data_1[k], data_2[k]) for k in data_1.keys()
            )
        elif isinstance(data_1, (tuple, list)):
            return len(data_1) == len(data_2) and all(
                torch_data_equivalence(o_1, o_2) for o_1, o_2 in zip(data_1, data_2)
            )
        elif isinstance(data_1, torch.Tensor):
            # Compare tensors by shape and value with a small absolute tolerance.
            return data_1.shape == data_2.shape and np.allclose(
                data_1, data_2, atol=0.00001
            )
        else:
            return data_1 == data_2
    else:
        return False
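
# Illustrative behaviour of the helper above (comments only, not executed):
#   torch_data_equivalence({"a": torch.tensor(1.0)}, {"a": torch.tensor(1.0)})  # True
#   torch_data_equivalence(torch.tensor(1.0), 1.0)  # False, the types differ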


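# NamedTuples appear in the roundtrip cases below because the converters are
# expected to rebuild the original NamedTuple subclass rather than collapse
# it into a plain tuple.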
class ExampleNamedTuple(NamedTuple):
    a: torch.Tensor
    b: torch.Tensor


@pytest.mark.parametrize(
    "value, expected_value",
    [
        (1.0, torch.tensor(1.0)),
        (2, torch.tensor(2)),
        ((3.0, 4), (torch.tensor(3.0), torch.tensor(4))),
        ([3.0, 4], [torch.tensor(3.0), torch.tensor(4)]),
        (
            {
                "a": 6.0,
                "b": 7,
            },
            {"a": torch.tensor(6.0), "b": torch.tensor(7)},
        ),
        (torch.tensor(1.0), torch.tensor(1.0)),
        (torch.tensor([1, 2]), torch.tensor([1, 2])),
        (
            torch.tensor([[1.0], [2.0]]),
            torch.tensor([[1.0], [2.0]]),
        ),
        (
            {
                "a": (
                    1,
                    torch.tensor(2.0),
                    torch.tensor([3, 4]),
                ),
                "b": {"c": 5},
            },
            {
                "a": (
                    torch.tensor(1),
                    torch.tensor(2.0),
                    torch.tensor([3, 4]),
                ),
                "b": {"c": torch.tensor(5)},
            },
        ),
        (
            ExampleNamedTuple(
                a=torch.tensor([1, 2]),
                b=torch.tensor([1.0, 2.0]),
            ),
            ExampleNamedTuple(
                a=torch.tensor([1, 2]),
                b=torch.tensor([1.0, 2.0]),
            ),
        ),
    ],
)
def test_roundtripping(value, expected_value):
    """Test torch -> jax -> torch roundtripping, as this is the direction used in the JaxToTorch wrapper."""
    # Printed values make parametrized failures easier to diagnose.
    print(f"{value=}")
    print(f"{torch_to_jax(value)=}")
    print(f"{jax_to_torch(torch_to_jax(value))=}")
    roundtripped_value = jax_to_torch(torch_to_jax(value))
    assert torch_data_equivalence(roundtripped_value, expected_value)


def _jax_reset_func(self, seed=None, options=None):
    """Reset function for the jax-based testing environment, returning jax arrays."""
    return jnp.array([1.0, 2.0, 3.0]), {"data": jnp.array([1, 2, 3])}


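# Returns the standard Gymnasium 5-tuple (obs, reward, terminated, truncated,
# info), built entirely from jax values so the wrapper's conversion is exercised.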
def _jax_step_func(self, action):
    """Step function for the jax-based testing environment."""
    assert isinstance(action, jax.Array), type(action)
    return (
        jnp.array([1, 2, 3]),
        jnp.array(5.0),
        jnp.array(True),
        jnp.array(False),
        {"data": jnp.array([1.0, 2.0])},
    )


def test_jax_to_torch_wrapper():
    """Tests the `JaxToTorch` wrapper."""
    env = GenericTestEnv(reset_func=_jax_reset_func, step_func=_jax_step_func)

    # Check that reset and step for the unwrapped jax environment return jax types
    obs, info = env.reset()
    assert isinstance(obs, jax.Array)
    assert isinstance(info, dict) and isinstance(info["data"], jax.Array)

    obs, reward, terminated, truncated, info = env.step(jnp.array([1, 2]))
    assert isinstance(obs, jax.Array)
    assert isinstance(reward, jax.Array)
    assert isinstance(terminated, jax.Array) and isinstance(truncated, jax.Array)
    assert isinstance(info, dict) and isinstance(info["data"], jax.Array)

    # Check that the wrapped environment converts jax values to torch equivalents
    wrapped_env = JaxToTorch(env)
    obs, info = wrapped_env.reset()
    assert isinstance(obs, torch.Tensor)
    assert isinstance(info, dict) and isinstance(info["data"], torch.Tensor)

    obs, reward, terminated, truncated, info = wrapped_env.step(torch.tensor([1, 2]))
    assert isinstance(obs, torch.Tensor)
    assert isinstance(reward, float)
    assert isinstance(terminated, bool) and isinstance(truncated, bool)
    assert isinstance(info, dict) and isinstance(info["data"], torch.Tensor)
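

# Illustrative usage sketch (comments only; assumes a registered jax-based
# environment id such as "phys2d/Pendulum-v0" and that a 1-element torch
# action is valid for it; neither assumption is verified by this test suite):
#
#   import gymnasium as gym
#   env = JaxToTorch(gym.make("phys2d/Pendulum-v0"))
#   obs, info = env.reset()  # obs is a torch.Tensor
#   obs, reward, terminated, truncated, info = env.step(torch.tensor([0.0]))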