MAJOR: Added image_representations for continuous envs, fixed some bugs, and made minor improvements

RaghuSpaceRajan · RaghuSpaceRajan · commit 3a17423ae0be · 2021-05-28T21:48:58.000+02:00
diff --git a/example.py b/example.py
@@ -25,7 +25,7 @@ def discrete_environment_example():
     config["seed"] = 0
 
     config["state_space_type"] = "discrete"
-    config["state_space_size"] = 8
+    config["action_space_size"] = 8
     config["delay"] = 1
     config["sequence_length"] = 3
     config["reward_scale"] = 2.5
@@ -59,7 +59,7 @@ def discrete_environment_image_representations_example():
     config["seed"] = 0
 
     config["state_space_type"] = "discrete"
-    config["state_space_size"] = 8
+    config["action_space_size"] = 8
     config["image_representations"] = True
     config["delay"] = 1
     config["sequence_length"] = 3
diff --git a/mdp_playground/envs/rl_toy_env.py b/mdp_playground/envs/rl_toy_env.py
diff --git a/mdp_playground/spaces/__init__.py b/mdp_playground/spaces/__init__.py
@@ -2,6 +2,8 @@
 from mdp_playground.spaces.box_extended import BoxExtended
 from mdp_playground.spaces.multi_discrete_extended import MultiDiscreteExtended
 from mdp_playground.spaces.image_multi_discrete import ImageMultiDiscrete
+from mdp_playground.spaces.image_continuous import ImageContinuous
 from mdp_playground.spaces.tuple_extended import TupleExtended
 
-__all__ = ["BoxExtended", "DiscreteExtended", "MultiDiscreteExtended", "ImageMultiDiscrete", "TupleExtended"]
+__all__ = ["BoxExtended", "DiscreteExtended", "MultiDiscreteExtended",
+           "ImageMultiDiscrete", "ImageContinuous", "TupleExtended"]
diff --git a/mdp_playground/spaces/image_continuous.py b/mdp_playground/spaces/image_continuous.py
@@ -0,0 +1,194 @@
+import warnings
+import numpy as np
+import gym
+from gym.spaces import Box, Space
+import PIL.ImageDraw as ImageDraw
+import PIL.Image as Image
+from PIL.Image import FLIP_LEFT_RIGHT, FLIP_TOP_BOTTOM
+import os
+
+class ImageContinuous(Box):
+    '''A space that maps a continuous 1- or 2-D space 1-to-1 to images so that the
+    images may be used as representations for corresponding continuous environments.
+
+    Methods
+    -------
+    get_concatenated_image(continuous_obs)
+        Gets an image representation for a given feature space observation
+    '''
+
+    def __init__(self, feature_space, term_spaces=None, width=100, height=100,
+                 circle_radius=5, target_point=None, relevant_indices=(0, 1),
+                 seed=None, use_custom_images=None, cust_path=None, dtype=np.uint8):
+        '''
+        Parameters
+        ----------
+        feature_space : Gym.spaces.Box
+            The 1-D feature space to which this class associates images as
+            external observations; bounds of the relevant dims must be finite
+        term_spaces : list of Gym.spaces.Box
+            Sub-spaces of the feature space which are terminal
+        width : int
+            The width of the image
+        height : int
+            The height of the image
+        circle_radius : int
+            The radius of the circle which represents the agent and target point
+        target_point : np.array
+            Target position in the relevant sub-space; drawn when not None
+        relevant_indices : list
+            Indices of the relevant features; the remaining ones are irrelevant
+        seed : int
+            Seed for this space
+        use_custom_images, cust_path
+            Accepted but not used by this constructor
+        dtype : np.dtype
+            dtype passed on to the underlying Box
+        '''
+        # ##TODO Define a common superclass for this and ImageMultiDiscrete
+        assert len(feature_space.shape) == 1
+        self.feature_space = feature_space
+        # Copy, so the caller's (or the default) sequence is never aliased
+        self.relevant_indices = list(relevant_indices)
+        # convert_to_pixel() divides by (high - low) of the relevant dims, so
+        # every one of those bounds must be finite; .any() let inf through
+        assert np.isfinite(feature_space.high[self.relevant_indices]).all()
+        assert np.isfinite(feature_space.low[self.relevant_indices]).all()
+        self.width = width
+        self.height = height
+        # Warn if resolution is too low?
+        self.circle_radius = circle_radius
+        self.target_point = target_point
+        self.term_spaces = term_spaces
+        all_indices = set(range(feature_space.shape[0]))
+        # sorted() keeps the order of the irrelevant dims deterministic
+        self.irrelevant_indices = sorted(all_indices - set(self.relevant_indices))
+        self.irrelevant_features = len(self.irrelevant_indices) > 0
+
+        self.goal_colour = (0, 255, 0)
+        self.agent_colour = (0, 0, 255)
+        self.term_colour = (0, 0, 0)
+
+        assert max(len(self.relevant_indices), len(self.irrelevant_indices)) <= 2, \
+                "Image observations are supported only for 1- or 2-D feature spaces."
+        # Shape has 1 appended for Ray Rllib to be compatible IIRC
+        super(ImageContinuous, self).__init__(shape=(width, height, 1),
+                dtype=dtype, low=0, high=255)
+        super(ImageContinuous, self).seed(seed=seed)
+
+        if self.target_point is not None:
+            self.target_point_pixel = self.convert_to_pixel(target_point)
+
+
+    def generate_image(self, position, relevant=True):
+        '''Renders one RGB image for a position in a (sub-)space.
+
+        Parameters
+        ----------
+        position : np.array
+            Position of the agent in feature space co-ordinates; it is
+            converted to pixels with convert_to_pixel()
+        relevant : bool
+            If True, the terminal sub-spaces and the target point (when set)
+            are drawn as well; if False, only the agent is drawn
+
+        Returns
+        -------
+        np.array
+            The RGB image with its first 2 axes swapped, so that axis 0 is the
+            X-axis of the image
+        '''
+        radius = self.circle_radius
+        # White RGB canvas. Mode "L" (black and white 8-bit pixels) would be an
+        # alternative in case custom images are not used.
+        canvas = Image.new("RGB", (self.width, self.height), color=(255,255,255))
+        painter = ImageDraw.Draw(canvas)
+
+        def bounding_box(centre):
+            # Corners of the square around a circle, see
+            # https://stackoverflow.com/a/2980931/11063709
+            return [tuple(centre - radius), tuple(centre + radius)]
+
+        if relevant and self.term_spaces is not None:
+            # Terminal regions go first, so that everything else is drawn on top
+            for term_space in self.term_spaces:
+                low_pixel = self.convert_to_pixel(term_space.low)
+                high_pixel = self.convert_to_pixel(term_space.high)
+                corners = [tuple(low_pixel), tuple(high_pixel)]
+                painter.rectangle(corners, fill=self.term_colour)
+
+        # The target point is only part of the relevant image
+        if relevant and self.target_point is not None:
+            painter.ellipse(bounding_box(self.target_point_pixel),
+                            fill=self.goal_colour)
+
+        # The agent comes last and is hence never hidden by the other shapes
+        agent_pixel = self.convert_to_pixel(position)
+        painter.ellipse(bounding_box(agent_pixel), fill=self.agent_colour)
+
+        # Because numpy is row-major and Image is column major, need to transpose
+        swapped = np.transpose(np.array(canvas), axes=(1, 0, 2))
+
+        return swapped
+
+    def get_concatenated_image(self, obs):
+        '''Builds the image observation for a feature space observation.
+
+        The image of the relevant sub-space comes first; if there are
+        irrelevant features, the image of the irrelevant sub-space (drawn
+        without target point and terminal sub-spaces) is appended to it along
+        axis 0, i.e., the X-axis of the image.
+        '''
+        parts = [self.generate_image(obs[self.relevant_indices])]
+        if self.irrelevant_features:
+            irrelevant_part = obs[self.irrelevant_indices]
+            parts.append(self.generate_image(irrelevant_part, relevant=False))
+
+        stitched = np.concatenate(tuple(parts), axis=0)
+        # Ray expects an image to have >=3 dims
+        return np.atleast_3d(stitched)
+
+    def convert_to_pixel(self, position):
+        '''Maps a position in feature space to integer pixel co-ordinates.
+
+        The position is rescaled with the bounds of the relevant dimensions,
+        which are also used for the irrelevant sub-space, i.e., both are
+        implicitly assumed to have the same bounds.
+        '''
+        idx = self.relevant_indices
+        lower, upper = self.feature_space.low[idx], self.feature_space.high[idx]
+        fraction = (position - lower) / (upper - lower)
+        return (fraction * self.shape[:2]).astype(int)  # truncates towards 0
+
+
+    def sample(self):
+        '''Returns the image of a point sampled from the feature space.'''
+        # The randomness comes from feature_space's own sample()
+        return self.get_concatenated_image(self.feature_space.sample())
+
+    def __repr__(self):
+        # Mentions the class, the underlying feature space and the image format
+        template = "{} with continuous underlying space of shape: {} and "\
+                "images of resolution: {} and dtype: {}"
+        return template.format(self.__class__, self.feature_space.shape, self.shape, self.dtype)
+
+    def contains(self, x):
+        """Return boolean specifying if x is a valid member of this space.
+
+        Only the shape is checked. NOTE(review): generate_image() yields 3
+        channels, which this check rejects - confirm the intended shape.
+        """
+        return np.shape(x) == (self.width, self.height, 1)  # TODO compare each pixel for all possible images?
+
+    def to_jsonable(self, sample_n):
+        """Convert a batch of samples from this space to a JSONable data type."""
+        # Not implemented for this space: always raises NotImplementedError
+        raise NotImplementedError
+
+    def from_jsonable(self, sample_n):
+        """Convert a JSONable data type to a batch of samples from this space."""
+        # Not implemented for this space: always raises NotImplementedError
+        raise NotImplementedError
+
+    def __eq__(self, other):
+        raise NotImplementedError  # equality is not implemented: any == comparison with this space raises
diff --git a/mdp_playground/spaces/image_multi_discrete.py b/mdp_playground/spaces/image_multi_discrete.py
@@ -16,7 +16,7 @@ class ImageMultiDiscrete(Box):
         Gets an image representation for a given multi_discrete_state
     '''
 
-    def __init__(self, state_space_sizes, width=100, height=100, circle_radius=20, transforms='rotate,flip,scale,shift', sh_quant=1, scale_range=(0.5,1.5), ro_quant=1, seed=None, use_custom_images=None, cust_path=None): # , polygon_sides=4
+    def __init__(self, state_space_sizes, width=100, height=100, circle_radius=20, transforms='rotate,flip,scale,shift', sh_quant=1, scale_range=(0.5,1.5), ro_quant=1, seed=None, use_custom_images=None, cust_path=None, dtype=np.uint8): # , polygon_sides=4
         '''
         Parameters
         ----------
@@ -84,7 +84,7 @@ def __init__(self, state_space_sizes, width=100, height=100, circle_radius=20, t
 
 
         # self.shape = (width, height, 1)
-        super(ImageMultiDiscrete, self).__init__(shape=(width, height, 1), dtype=np.int64, low=0, high=255) #
+        super(ImageMultiDiscrete, self).__init__(shape=(width, height, 1), dtype=dtype, low=0, high=255) #
         super(ImageMultiDiscrete, self).seed(seed=seed) #
 
     # def seed(self, seed=None):
@@ -214,21 +214,24 @@ def get_concatenated_image(self, multi_discrete_state,):
         #     concatenated_image.append(self.disjoint_states[i][multi_discrete_state[i]])
         concatenated_image = np.concatenate(tuple(concatenated_image), axis=0)
 
-        return concatenated_image[..., np.newaxis] # because Ray expects an image to have >=3 dims
+        return np.atleast_3d(concatenated_image) # because Ray expects an image to have >=3 dims
 
     # def get_multi_discrete_state(self,
 
     def sample(self):
         sss = np.array(self.state_space_sizes)
-        sampled = (self.np_random.random_sample(sss.shape) * sss).astype(np.int64) # Based on Gym's MultiDiscrete sampling
+        sampled = (self.np_random.random_sample(sss.shape) * sss).astype(np.int64) # Based on Gym's MultiDiscrete sampling; these are state indices, so they stay int64 whatever the image dtype is
         # if type(sampled) == int:
         #     sampled = [sampled]
         sampled = list(sampled)
 
         return self.get_concatenated_image(sampled)
 
     def __repr__(self):
-        return "ImageMultiDiscrete with multi-discrete space of shape: {} and images of resolution: {}".format(self.state_space_sizes, self.shape)
+        template = "{} with multi-discrete space of shape: {} and "\
+                "images of resolution: {} and dtype: {}"
+        return template.format(self.__class__, self.state_space_sizes,
+                               self.shape, self.dtype)
 
     def contains(self, x):
         """
diff --git a/mdp_playground/spaces/test_image_continuous.py b/mdp_playground/spaces/test_image_continuous.py
@@ -0,0 +1,62 @@
+import unittest
+import numpy as np
+from mdp_playground.spaces.image_continuous import ImageContinuous
+from gym.spaces import Box
+# import PIL.ImageDraw as ImageDraw
+import PIL.Image as Image
+
+
+class TestImageContinuous(unittest.TestCase):
+    '''Checks the images drawn by ImageContinuous pixel by pixel.'''
+
+    WHITE, BLACK = (255, 255, 255), (0, 0, 0)
+    GREEN, BLUE = (0, 255, 0), (0, 0, 255)
+
+    def test_image_continuous(self):
+        cs2 = Box(shape=(2,), low=0.0, high=20.0,)
+        cs4 = Box(shape=(4,), low=0.0, high=20.0,)
+
+        # Agent only: [5, 7] in [0, 20]^2 lies around pixel (100, 140)
+        imc = ImageContinuous(cs2, width=400, height=400,)
+        pos = np.array([5.0, 7.0])
+        img = imc.generate_image(pos)
+        self.assertEqual(img.shape, (400, 400, 3))
+        self.assertEqual(tuple(img[100, 140]), self.BLUE)
+        self.assertEqual(tuple(img[200, 200]), self.WHITE)
+
+        # Target point at [10, 10], i.e., pixel (200, 200)
+        target = np.array([10, 10])
+        imc = ImageContinuous(cs2, target_point=target, width=400, height=400,)
+        img = imc.generate_image(pos)
+        self.assertEqual(tuple(img[200, 200]), self.GREEN)
+        self.assertEqual(tuple(img[100, 140]), self.BLUE)
+
+        # Terminal sub-spaces
+        cs2_term1 = Box(low=np.array([2., 4.]), high=np.array([3., 6.]),)
+        cs2_term2 = Box(low=np.array([12., 3.]), high=np.array([13., 4.]),)
+        term_spaces = [cs2_term1, cs2_term2]
+        imc = ImageContinuous(cs2, target_point=target, term_spaces=term_spaces,
+                        width=400, height=400,)
+        img = imc.get_concatenated_image(pos)
+        self.assertEqual(img.shape, (400, 400, 3))
+        self.assertEqual(tuple(img[50, 100]), self.BLACK)
+        self.assertEqual(tuple(img[250, 70]), self.BLACK)
+
+        # Irrelevant features: a 2nd image is appended along axis 0; it shows
+        # the agent at [10, 15] -> pixel (200, 300), but no target point
+        imc = ImageContinuous(cs4, target_point=target, width=400, height=400,)
+        img = imc.get_concatenated_image(np.array([5.0, 7.0, 10.0, 15.0]))
+        self.assertEqual(img.shape, (800, 400, 3))
+        self.assertEqual(tuple(img[200, 200]), self.GREEN)
+        self.assertEqual(tuple(img[400 + 200, 300]), self.BLUE)
+        self.assertEqual(tuple(img[400 + 200, 200]), self.WHITE)
+
+        # Random sample and __repr__
+        self.assertEqual(imc.sample().shape, (800, 400, 3))
+        self.assertIn("ImageContinuous", repr(imc))
+
+
+
+
+if __name__ == '__main__':
+    unittest.main()
diff --git a/mdp_playground/spaces/test_image_multi_discrete.py b/mdp_playground/spaces/test_image_multi_discrete.py
@@ -1,6 +1,6 @@
 import unittest
 import numpy as np
-from gym.spaces.image_multi_discrete import ImageMultiDiscrete
+from mdp_playground.spaces.image_multi_discrete import ImageMultiDiscrete
 from gym.spaces import Discrete, MultiDiscrete
 # import gym
 # from gym.spaces import MultiDiscrete
@@ -13,6 +13,8 @@ class TestImageMultiDiscrete(unittest.TestCase):
 
     def test_image_multi_discrete(self):
         ds4 = Discrete(4)
+        ds4 = [ds4.n]
+        print(ds4)
         imd = ImageMultiDiscrete(ds4, transforms='shift')
         from PIL import Image
         # img1 = Image.fromarray(imd.disjoint_states[0][1], 'L')
diff --git a/test_mdp_playground.py b/test_mdp_playground.py