Gymnasium/gym/spaces/high_low.py

from gym import Space
import numpy as np

class HighLow(Space):
    """
    A space of n independently bounded values, described by a matrix of dimensions n x 3, where

    - n is the number of options in the space (e.g. buttons that can be pressed simultaneously)
    - column 0 is the minimum value (inclusive) that the option can have
    - column 1 is the maximum value (inclusive) that the option can have
    - column 2 is the precision (0 = rounded to integer, 2 = rounded to 2 decimals)

    e.g. if the space is composed of ATTACK (values: 0-100), MOVE_LEFT(0-1), MOVE_RIGHT(0,1)
    the space would be [ [0.0, 100.0, 2], [0, 1, 0], [0, 1, 0] ]
    """

    # Defining __eq__ makes instances unhashable in Python 3; spell that out
    # because the wrapped matrix is mutable and must not be used as a key.
    __hash__ = None

    def __init__(self, matrix, np_random=None):
        """
        Store the bounds matrix and the random source used by `sample`.

        matrix: an object exposing a 2-D `.shape` of (n, 3) with n >= 1 (np.matrix or 2-D
            np.ndarray), where the first column is the minimum (inclusive), the second column
            is the maximum (inclusive), and the third column is the precision (number of
            decimals to keep)
        np_random: object providing `rand(rows, cols)` (e.g. np.random.RandomState);
            defaults to the global `np.random` module

        e.g. np.matrix([[0, 1, 0], [0, 1, 0], [0.0, 100.0, 2]])

        Raises AssertionError if the matrix does not have shape (n >= 1, 3).
        """
        if np_random is None:
            np_random = np.random
        self.np_random = np_random

        (num_rows, num_cols) = matrix.shape
        assert num_rows >= 1, "HighLow needs at least one option (row)"
        assert num_cols == 3, "HighLow rows must be [min, max, precision]"
        self.matrix = matrix
        self.num_rows = num_rows

    def sample(self):
        """
        Draw one value per option: round(random * (max - min) + min, precision).

        Returns a 1-D float array of length n.
        """
        # Work on a plain 2-D ndarray so column slices are 1-D whether the
        # bounds were supplied as np.matrix or np.ndarray; slicing an ndarray
        # directly against an (n, 1) random column would broadcast to (n, n).
        bounds = np.asarray(self.matrix, dtype=float)
        lows = bounds[:, 0]
        spans = bounds[:, 1] - lows
        # Keep the (n, 1) request so the random stream is consumed as before.
        draws = np.asarray(self.np_random.rand(self.num_rows, 1)).reshape(-1)
        values = spans * draws + lows
        return np.array([
            round(value, int(digits))
            for value, digits in zip(values, bounds[:, 2])
        ])

    def contains(self, x):
        """
        Return True if x holds exactly n numeric values, each within its option's
        [min, max] range (inclusive). Anything that cannot be read as such
        (wrong length, non-numeric, NaN) yields False.
        """
        try:
            candidate = np.asarray(x, dtype=float)
        except (TypeError, ValueError):
            return False
        if candidate.ndim == 0 or candidate.shape[0] != self.num_rows:
            return False
        # Accept (n,) and (n, 1) layouts alike; reject anything with extra values.
        if candidate.size != self.num_rows:
            return False
        flat = candidate.reshape(-1)
        bounds = np.asarray(self.matrix, dtype=float)
        # NaN compares False on both sides, so it is rejected here.
        return bool(np.all((bounds[:, 0] <= flat) & (flat <= bounds[:, 1])))

    def to_jsonable(self, sample_n):
        """Convert a batch of samples into nested Python lists."""
        return np.array(sample_n).tolist()

    def from_jsonable(self, sample_n):
        """Convert a batch of JSON-decoded samples into a list of arrays."""
        return [np.asarray(sample) for sample in sample_n]

    @property
    def shape(self):
        """Shape of the underlying bounds matrix, i.e. (n, 3)."""
        return self.matrix.shape

    def __repr__(self):
        return "High-Low" + str(self.shape)

    def __eq__(self, other):
        """Two HighLow spaces are equal when their bounds matrices match exactly."""
        if not isinstance(other, HighLow):
            return NotImplemented
        # array_equal yields a single truth value (False on shape mismatch)
        # instead of an element-wise comparison matrix.
        return bool(np.array_equal(self.matrix, other.matrix))
Add Doom envs (group key doom) 2016-05-17 00:46:03 -07:00			`from gym import Space`
			`import numpy as np`

			`class HighLow(Space):`
			`"""`
			`A matrix of dimensions n x 3, where`

			`- n is the number of options in the space (e.g. buttons that can be pressed simultaneously)`
			`- u[1] (the first column) is the minimum value (inclusive) that the option can have`
			`- u[2] (the second column) is the maximum value (inclusive) that the option can have`
			`- u[3] (the third column) is the precision (0 = rounded to integer, 2 = rounded to 2 decimals)`

			`e.g. if the space is composed of ATTACK (values: 0-100), MOVE_LEFT(0-1), MOVE_RIGHT(0,1)`
			`the space would be [ [0.0, 100.0, 2], [0, 1, 0], [0, 1, 0] ]`
			`"""`
[WIP] add support for seeding environments (#135) * Make environments seedable * Fix monitor bugs - Set monitor_id before setting the infix. This was a bug that would yield incorrect results with multiple monitors. - Remove extra pid from stats recorder filename. This should be purely cosmetic. * Start uploading seeds in episode_batch * Fix _bigint_from_bytes for python3 * Set seed explicitly in random_agent * Pass through seed argument * Also pass through random state to spaces * Pass random state into the observation/action spaces * Make all _seed methods return the list of used seeds * Switch over to np.random where possible * Start hashing seeds, and also seed doom engine * Fixup seeding determinism in many cases * Seed before loading the ROM * Make seeding more Python3 friendly * Make the MuJoCo skipping a bit more forgiving * Remove debugging PDB calls * Make setInt argument into raw bytes * Validate and upload seeds * Skip box2d * Make seeds smaller, and change representation of seeds in upload * Handle long seeds * Fix RandomAgent example to be deterministic * Handle integer types correctly in Python2 and Python3 * Try caching pip * Try adding swap * Add df and free calls * Bump swap * Bump swap size * Try setting overcommit * Try other sysctls * Try fixing overcommit * Try just setting overcommit_memory=1 * Add explanatory comment * Add what's new section to readme * BUG: Mark ElevatorAction-ram-v0 as non-deterministic for now * Document seed * Move nondetermistic check into spec 2016-05-29 09:07:09 -07:00			`def __init__(self, matrix, np_random=None):`
Add Doom envs (group key doom) 2016-05-17 00:46:03 -07:00			`"""`
			`A matrix of shape (n, 3), where the first column is the minimum (inclusive), the second column`
			`is the maximum (inclusive), and the third column is the precision (number of decimals to keep)`

			`e.g. np.matrix([[0, 1, 0], [0, 1, 0], [0.0, 100.0, 2]])`
			`"""`
[WIP] add support for seeding environments (#135) * Make environments seedable * Fix monitor bugs - Set monitor_id before setting the infix. This was a bug that would yield incorrect results with multiple monitors. - Remove extra pid from stats recorder filename. This should be purely cosmetic. * Start uploading seeds in episode_batch * Fix _bigint_from_bytes for python3 * Set seed explicitly in random_agent * Pass through seed argument * Also pass through random state to spaces * Pass random state into the observation/action spaces * Make all _seed methods return the list of used seeds * Switch over to np.random where possible * Start hashing seeds, and also seed doom engine * Fixup seeding determinism in many cases * Seed before loading the ROM * Make seeding more Python3 friendly * Make the MuJoCo skipping a bit more forgiving * Remove debugging PDB calls * Make setInt argument into raw bytes * Validate and upload seeds * Skip box2d * Make seeds smaller, and change representation of seeds in upload * Handle long seeds * Fix RandomAgent example to be deterministic * Handle integer types correctly in Python2 and Python3 * Try caching pip * Try adding swap * Add df and free calls * Bump swap * Bump swap size * Try setting overcommit * Try other sysctls * Try fixing overcommit * Try just setting overcommit_memory=1 * Add explanatory comment * Add what's new section to readme * BUG: Mark ElevatorAction-ram-v0 as non-deterministic for now * Document seed * Move nondetermistic check into spec 2016-05-29 09:07:09 -07:00			`if np_random is None:`
			`np_random = np.random`
			`self.np_random = np_random`

Add Doom envs (group key doom) 2016-05-17 00:46:03 -07:00			`(num_rows, num_cols) = matrix.shape`
			`assert num_rows >= 1`
			`assert num_cols == 3`
			`self.matrix = matrix`
			`self.num_rows = num_rows`

			`def sample(self):`
			`# For each row: round(random .* (max - min) + min, precision)`
			`max_minus_min = self.matrix[:, 1] - self.matrix[:, 0]`
[WIP] add support for seeding environments (#135) * Make environments seedable * Fix monitor bugs - Set monitor_id before setting the infix. This was a bug that would yield incorrect results with multiple monitors. - Remove extra pid from stats recorder filename. This should be purely cosmetic. * Start uploading seeds in episode_batch * Fix _bigint_from_bytes for python3 * Set seed explicitly in random_agent * Pass through seed argument * Also pass through random state to spaces * Pass random state into the observation/action spaces * Make all _seed methods return the list of used seeds * Switch over to np.random where possible * Start hashing seeds, and also seed doom engine * Fixup seeding determinism in many cases * Seed before loading the ROM * Make seeding more Python3 friendly * Make the MuJoCo skipping a bit more forgiving * Remove debugging PDB calls * Make setInt argument into raw bytes * Validate and upload seeds * Skip box2d * Make seeds smaller, and change representation of seeds in upload * Handle long seeds * Fix RandomAgent example to be deterministic * Handle integer types correctly in Python2 and Python3 * Try caching pip * Try adding swap * Add df and free calls * Bump swap * Bump swap size * Try setting overcommit * Try other sysctls * Try fixing overcommit * Try just setting overcommit_memory=1 * Add explanatory comment * Add what's new section to readme * BUG: Mark ElevatorAction-ram-v0 as non-deterministic for now * Document seed * Move nondetermistic check into spec 2016-05-29 09:07:09 -07:00			`random_matrix = np.multiply(max_minus_min, self.np_random.rand(self.num_rows, 1)) + self.matrix[:, 0]`
Add Doom envs (group key doom) 2016-05-17 00:46:03 -07:00			`rounded_matrix = np.zeros(self.num_rows)`
			`for i in range(self.num_rows):`
			`rounded_matrix[i] = round(random_matrix[i, 0], int(self.matrix[i, 2]))`
			`return rounded_matrix`

			`def contains(self, x):`
			`if x.shape[0] != self.num_rows:`
			`return False`
			`for i in range(self.num_rows):`
			`if not (self.matrix[i, 0] <= x[i] <= self.matrix[i, 1]):`
			`return False`
			`return True`

			`def to_jsonable(self, sample_n):`
			`return np.array(sample_n).tolist()`
			`def from_jsonable(self, sample_n):`
			`return [np.asarray(sample) for sample in sample_n]`

			`@property`
			`def shape(self):`
			`return self.matrix.shape`
			`def __repr__(self):`
			`return "High-Low" + str(self.shape)`
			`def __eq__(self, other):`
			`return self.matrix == other.matrix`