Merge v1.0.0 (#682)

Co-authored-by: Kallinteris Andreas <30759571+Kallinteris-Andreas@users.noreply.github.com> Co-authored-by: Jet <38184875+jjshoots@users.noreply.github.com> Co-authored-by: Omar Younis <42100908+younik@users.noreply.github.com>
2025-08-23 15:04:20 +00:00 · 2023-11-07 13:27:25 +00:00
parent cf5f588433
commit 27f8e85051
256 changed files with 7051 additions and 13421 deletions
--- a/tests/wrappers/test_jax_to_torch.py
+++ b/tests/wrappers/test_jax_to_torch.py
@@ -0,0 +1,112 @@
+"""Test suite for TorchToJax wrapper."""
+
+import numpy as np
+import pytest
+
+
+jax = pytest.importorskip("jax")
+jnp = pytest.importorskip("jax.numpy")
+torch = pytest.importorskip("torch")
+
+from gymnasium.wrappers.jax_to_torch import (  # noqa: E402
+    JaxToTorch,
+    jax_to_torch,
+    torch_to_jax,
+)
+from tests.testing_env import GenericTestEnv  # noqa: E402
+
+
+def torch_data_equivalence(data_1, data_2) -> bool:
+    """Return if two variables are equivalent that might contain ``torch.Tensor``."""
+    if type(data_1) == type(data_2):
+        if isinstance(data_1, dict):
+            return data_1.keys() == data_2.keys() and all(
+                torch_data_equivalence(data_1[k], data_2[k]) for k in data_1.keys()
+            )
+        elif isinstance(data_1, (tuple, list)):
+            return len(data_1) == len(data_2) and all(
+                torch_data_equivalence(o_1, o_2) for o_1, o_2 in zip(data_1, data_2)
+            )
+        elif isinstance(data_1, torch.Tensor):
+            return data_1.shape == data_2.shape and np.allclose(
+                data_1, data_2, atol=0.00001
+            )
+        else:
+            return data_1 == data_2
+    else:
+        return False
+
+
+@pytest.mark.parametrize(
+    "value, expected_value",
+    [
+        (1.0, torch.tensor(1.0)),
+        (2, torch.tensor(2)),
+        ((3.0, 4), (torch.tensor(3.0), torch.tensor(4))),
+        ([3.0, 4], [torch.tensor(3.0), torch.tensor(4)]),
+        (
+            {
+                "a": 6.0,
+                "b": 7,
+            },
+            {"a": torch.tensor(6.0), "b": torch.tensor(7)},
+        ),
+        (torch.tensor(1.0), torch.tensor(1.0)),
+        (torch.tensor([1, 2]), torch.tensor([1, 2])),
+        (torch.tensor([[1.0], [2.0]]), torch.tensor([[1.0], [2.0]])),
+        (
+            {"a": (1, torch.tensor(2.0), torch.tensor([3, 4])), "b": {"c": 5}},
+            {
+                "a": (torch.tensor(1), torch.tensor(2.0), torch.tensor([3, 4])),
+                "b": {"c": torch.tensor(5)},
+            },
+        ),
+    ],
+)
+def test_roundtripping(value, expected_value):
+    """We test numpy -> jax -> numpy as this is direction in the NumpyToJax wrapper."""
+    roundtripped_value = jax_to_torch(torch_to_jax(value))
+    assert torch_data_equivalence(roundtripped_value, expected_value)
+
+
+def _jax_reset_func(self, seed=None, options=None):
+    return jnp.array([1.0, 2.0, 3.0]), {"data": jnp.array([1, 2, 3])}
+
+
+def _jax_step_func(self, action):
+    assert isinstance(action, jax.Array), type(action)
+    return (
+        jnp.array([1, 2, 3]),
+        jnp.array(5.0),
+        jnp.array(True),
+        jnp.array(False),
+        {"data": jnp.array([1.0, 2.0])},
+    )
+
+
+def test_jax_to_torch_wrapper():
+    """Tests the `JaxToTorchV0` wrapper."""
+    env = GenericTestEnv(reset_func=_jax_reset_func, step_func=_jax_step_func)
+
+    # Check that the reset and step for jax environment are as expected
+    obs, info = env.reset()
+    assert isinstance(obs, jax.Array)
+    assert isinstance(info, dict) and isinstance(info["data"], jax.Array)
+
+    obs, reward, terminated, truncated, info = env.step(jnp.array([1, 2]))
+    assert isinstance(obs, jax.Array)
+    assert isinstance(reward, jax.Array)
+    assert isinstance(terminated, jax.Array) and isinstance(truncated, jax.Array)
+    assert isinstance(info, dict) and isinstance(info["data"], jax.Array)
+
+    # Check that the wrapped version is correct.
+    wrapped_env = JaxToTorch(env)
+    obs, info = wrapped_env.reset()
+    assert isinstance(obs, torch.Tensor)
+    assert isinstance(info, dict) and isinstance(info["data"], torch.Tensor)
+
+    obs, reward, terminated, truncated, info = wrapped_env.step(torch.tensor([1, 2]))
+    assert isinstance(obs, torch.Tensor)
+    assert isinstance(reward, float)
+    assert isinstance(terminated, bool) and isinstance(truncated, bool)
+    assert isinstance(info, dict) and isinstance(info["data"], torch.Tensor)